diff --git "a/wandb/run-20220228_223243-2ay2wvge/files/wandb-summary.json" "b/wandb/run-20220228_223243-2ay2wvge/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220228_223243-2ay2wvge/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 4.9575, "train/learning_rate": 9.920000000000002e-06, "train/epoch": 0.49, "train/global_step": 500, "_runtime": 2346, "_timestamp": 1646089909, "_step": 499, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 22.0, 439.0, 516.0, 37.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-45.76547622680664, -38.26892852783203, -30.772380828857422, -23.275835037231445, -15.779287338256836, -8.28274154663086, -0.78619384765625, 6.710353851318359, 14.206901550292969, 21.703449249267578, 29.199996948242188, 36.69654083251953, 44.193092346191406, 51.68963623046875, 59.18618392944336, 66.68273162841797, 74.17927551269531, 81.67581939697266, 89.17237091064453, 96.66891479492188, 104.16546630859375, 111.6620101928711, 119.15855407714844, 126.65510559082031, 134.1516571044922, 141.64820861816406, 149.14474487304688, 156.64129638671875, 164.13784790039062, 171.6343994140625, 179.1309356689453, 186.6274871826172, 194.12403869628906, 201.62059020996094, 209.11712646484375, 216.61367797851562, 224.1102294921875, 231.60678100585938, 239.1033172607422, 246.59986877441406, 254.09642028808594, 261.59295654296875, 269.0895080566406, 276.5860595703125, 284.0826110839844, 291.57916259765625, 299.0757141113281, 306.572265625, 314.06878662109375, 321.5653381347656, 329.0618896484375, 336.5584411621094, 344.0549621582031, 351.551513671875, 359.0480651855469, 366.54461669921875, 374.0411682128906, 381.5377197265625, 389.0342712402344, 396.53082275390625, 404.02734375, 411.5238952636719, 419.02044677734375, 426.5169982910156, 434.0135498046875]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 4.0, 10.0, 6.0, 8.0, 11.0, 16.0, 23.0, 26.0, 25.0, 31.0, 33.0, 48.0, 43.0, 50.0, 56.0, 47.0, 53.0, 59.0, 46.0, 51.0, 52.0, 43.0, 47.0, 43.0, 38.0, 17.0, 25.0, 27.0, 21.0, 10.0, 8.0, 8.0, 6.0, 10.0, 2.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-76.76583862304688, -74.85212707519531, -72.93841552734375, -71.02470397949219, -69.11099243164062, -67.1972885131836, -65.28357696533203, -63.36986541748047, -61.456153869628906, -59.542442321777344, -57.62873077392578, -55.715023040771484, -53.80131149291992, -51.88759994506836, -49.97389221191406, -48.0601806640625, -46.14646911621094, -44.232757568359375, -42.31904602050781, -40.405338287353516, -38.49162673950195, -36.57791519165039, -34.664207458496094, -32.75049591064453, -30.83678436279297, -28.923072814941406, -27.009363174438477, -25.095653533935547, -23.181941986083984, -21.268230438232422, -19.354520797729492, -17.440811157226562, -15.527099609375, -13.613389015197754, -11.699678421020508, -9.785967826843262, -7.872257232666016, -5.9585466384887695, -4.044836044311523, -2.1311254501342773, -0.21741485595703125, 1.6962957382202148, 3.610006332397461, 5.523716926574707, 7.437427520751953, 9.3511381149292, 11.264848709106445, 13.178559303283691, 15.092269897460938, 17.0059814453125, 18.91969108581543, 20.83340072631836, 22.747112274169922, 24.660823822021484, 26.574533462524414, 28.488243103027344, 30.401954650878906, 32.31566619873047, 34.22937774658203, 36.14308547973633, 38.05679702758789, 39.97050857543945, 41.88421630859375, 43.79792785644531, 45.711639404296875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 5.0, 6.0, 9.0, 12.0, 9.0, 11.0, 13.0, 19.0, 15.0, 22.0, 20.0, 33.0, 32.0, 29.0, 33.0, 53.0, 45.0, 43.0, 43.0, 62.0, 60.0, 55.0, 51.0, 42.0, 41.0, 46.0, 34.0, 30.0, 17.0, 26.0, 17.0, 17.0, 11.0, 13.0, 12.0, 4.0, 6.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.779296875, -2.656707763671875, -2.53411865234375, -2.411529541015625, -2.2889404296875, -2.166351318359375, -2.04376220703125, -1.921173095703125, -1.798583984375, -1.675994873046875, -1.55340576171875, -1.430816650390625, -1.3082275390625, -1.185638427734375, -1.06304931640625, -0.940460205078125, -0.81787109375, -0.695281982421875, -0.57269287109375, -0.450103759765625, -0.3275146484375, -0.204925537109375, -0.08233642578125, 0.040252685546875, 0.162841796875, 0.285430908203125, 0.40802001953125, 0.530609130859375, 0.6531982421875, 0.775787353515625, 0.89837646484375, 1.020965576171875, 1.1435546875, 1.266143798828125, 1.38873291015625, 1.511322021484375, 1.6339111328125, 1.756500244140625, 1.87908935546875, 2.001678466796875, 2.124267578125, 2.246856689453125, 2.36944580078125, 2.492034912109375, 2.6146240234375, 2.737213134765625, 2.85980224609375, 2.982391357421875, 3.10498046875, 3.227569580078125, 3.35015869140625, 3.472747802734375, 3.5953369140625, 3.717926025390625, 3.84051513671875, 3.963104248046875, 4.085693359375, 4.208282470703125, 4.33087158203125, 4.453460693359375, 4.5760498046875, 4.698638916015625, 4.82122802734375, 4.943817138671875, 5.06640625]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 13.0, 8.0, 13.0, 19.0, 36.0, 53.0, 80.0, 99.0, 139.0, 197.0, 277.0, 399.0, 642.0, 1084.0, 1842.0, 3964.0, 9748.0, 33195.0, 215431.0, 2173143.0, 1573533.0, 139899.0, 25074.0, 7771.0, 3241.0, 1705.0, 969.0, 560.0, 347.0, 237.0, 144.0, 121.0, 80.0, 58.0, 48.0, 32.0, 28.0, 11.0, 17.0, 9.0, 5.0, 9.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.1171875, -8.7783203125, -8.439453125, -8.1005859375, -7.76171875, -7.4228515625, -7.083984375, -6.7451171875, -6.40625, -6.0673828125, -5.728515625, -5.3896484375, -5.05078125, -4.7119140625, -4.373046875, -4.0341796875, -3.6953125, -3.3564453125, -3.017578125, -2.6787109375, -2.33984375, -2.0009765625, -1.662109375, -1.3232421875, -0.984375, -0.6455078125, -0.306640625, 0.0322265625, 0.37109375, 0.7099609375, 1.048828125, 1.3876953125, 1.7265625, 2.0654296875, 2.404296875, 2.7431640625, 3.08203125, 3.4208984375, 3.759765625, 4.0986328125, 4.4375, 4.7763671875, 5.115234375, 5.4541015625, 5.79296875, 6.1318359375, 6.470703125, 6.8095703125, 7.1484375, 7.4873046875, 7.826171875, 8.1650390625, 8.50390625, 8.8427734375, 9.181640625, 9.5205078125, 9.859375, 10.1982421875, 10.537109375, 10.8759765625, 11.21484375, 11.5537109375, 11.892578125, 12.2314453125, 12.5703125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 3.0, 15.0, 11.0, 20.0, 22.0, 44.0, 62.0, 90.0, 124.0, 176.0, 324.0, 482.0, 625.0, 623.0, 475.0, 295.0, 220.0, 129.0, 98.0, 58.0, 50.0, 30.0, 28.0, 18.0, 13.0, 9.0, 7.0, 8.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-14.2109375, -13.7366943359375, -13.262451171875, -12.7882080078125, -12.31396484375, -11.8397216796875, -11.365478515625, -10.8912353515625, -10.4169921875, -9.9427490234375, -9.468505859375, -8.9942626953125, -8.52001953125, -8.0457763671875, -7.571533203125, -7.0972900390625, -6.623046875, -6.1488037109375, -5.674560546875, -5.2003173828125, -4.72607421875, -4.2518310546875, -3.777587890625, -3.3033447265625, -2.8291015625, -2.3548583984375, -1.880615234375, -1.4063720703125, -0.93212890625, -0.4578857421875, 0.016357421875, 0.4906005859375, 0.96484375, 1.4390869140625, 1.913330078125, 2.3875732421875, 2.86181640625, 3.3360595703125, 3.810302734375, 4.2845458984375, 4.7587890625, 5.2330322265625, 5.707275390625, 6.1815185546875, 6.65576171875, 7.1300048828125, 7.604248046875, 8.0784912109375, 8.552734375, 9.0269775390625, 9.501220703125, 9.9754638671875, 10.44970703125, 10.9239501953125, 11.398193359375, 11.8724365234375, 12.3466796875, 12.8209228515625, 13.295166015625, 13.7694091796875, 14.24365234375, 14.7178955078125, 15.192138671875, 15.6663818359375, 16.140625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 9.0, 3.0, 9.0, 15.0, 14.0, 26.0, 36.0, 54.0, 72.0, 98.0, 154.0, 264.0, 431.0, 710.0, 1723.0, 6550.0, 430786.0, 3723474.0, 24312.0, 2889.0, 1112.0, 529.0, 352.0, 204.0, 131.0, 98.0, 65.0, 43.0, 32.0, 23.0, 17.0, 7.0, 5.0, 8.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.0625, -41.53662109375, -40.0107421875, -38.48486328125, -36.958984375, -35.43310546875, -33.9072265625, -32.38134765625, -30.85546875, -29.32958984375, -27.8037109375, -26.27783203125, -24.751953125, -23.22607421875, -21.7001953125, -20.17431640625, -18.6484375, -17.12255859375, -15.5966796875, -14.07080078125, -12.544921875, -11.01904296875, -9.4931640625, -7.96728515625, -6.44140625, -4.91552734375, -3.3896484375, -1.86376953125, -0.337890625, 1.18798828125, 2.7138671875, 4.23974609375, 5.765625, 7.29150390625, 8.8173828125, 10.34326171875, 11.869140625, 13.39501953125, 14.9208984375, 16.44677734375, 17.97265625, 19.49853515625, 21.0244140625, 22.55029296875, 24.076171875, 25.60205078125, 27.1279296875, 28.65380859375, 30.1796875, 31.70556640625, 33.2314453125, 34.75732421875, 36.283203125, 37.80908203125, 39.3349609375, 40.86083984375, 42.38671875, 43.91259765625, 45.4384765625, 46.96435546875, 48.490234375, 50.01611328125, 51.5419921875, 53.06787109375, 54.59375]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 16.0, 878.0, 117.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-632.0731201171875, -619.8186645507812, -607.5641479492188, -595.3096923828125, -583.0552368164062, -570.8007202148438, -558.5462646484375, -546.291748046875, -534.0372924804688, -521.7828369140625, -509.5283508300781, -497.27386474609375, -485.0193786621094, -472.764892578125, -460.51043701171875, -448.2559509277344, -436.00146484375, -423.7469787597656, -411.4925231933594, -399.238037109375, -386.9835510253906, -374.72906494140625, -362.474609375, -350.2201232910156, -337.9656677246094, -325.711181640625, -313.45672607421875, -301.2022399902344, -288.94775390625, -276.6932678222656, -264.4388122558594, -252.184326171875, -239.9298553466797, -227.67538452148438, -215.4208984375, -203.1664276123047, -190.9119415283203, -178.657470703125, -166.40298461914062, -154.1485137939453, -141.89404296875, -129.6395721435547, -117.38508605957031, -105.130615234375, -92.87612915039062, -80.62165832519531, -68.36717987060547, -56.112701416015625, -43.85821533203125, -31.603736877441406, -19.349260330200195, -7.094783782958984, 5.159694671630859, 17.414173126220703, 29.66864776611328, 41.923126220703125, 54.17760467529297, 66.43208312988281, 78.68656158447266, 90.9410400390625, 103.19551086425781, 115.44999694824219, 127.7044677734375, 139.95895385742188, 152.2134246826172]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 8.0, 13.0, 18.0, 13.0, 17.0, 20.0, 20.0, 24.0, 37.0, 35.0, 23.0, 32.0, 33.0, 57.0, 50.0, 45.0, 37.0, 54.0, 47.0, 45.0, 51.0, 33.0, 34.0, 35.0, 34.0, 31.0, 19.0, 32.0, 17.0, 19.0, 10.0, 9.0, 11.0, 7.0, 8.0, 9.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-56.682403564453125, -55.01915740966797, -53.35591125488281, -51.692665100097656, -50.0294189453125, -48.366172790527344, -46.70292282104492, -45.039676666259766, -43.37643051147461, -41.71318435668945, -40.0499382019043, -38.38669204711914, -36.72344207763672, -35.06019592285156, -33.396949768066406, -31.73370361328125, -30.070457458496094, -28.407211303710938, -26.74396514892578, -25.080717086791992, -23.417470932006836, -21.75422477722168, -20.09097671508789, -18.427730560302734, -16.764484405517578, -15.101238250732422, -13.43799114227295, -11.774744033813477, -10.11149787902832, -8.448251724243164, -6.785004615783691, -5.121757507324219, -3.4585113525390625, -1.795264720916748, -0.1320180892944336, 1.5312285423278809, 3.1944751739501953, 4.857721328735352, 6.520968437194824, 8.184215545654297, 9.847461700439453, 11.51070785522461, 13.173954963684082, 14.837202072143555, 16.50044822692871, 18.163694381713867, 19.826942443847656, 21.490188598632812, 23.15343475341797, 24.816680908203125, 26.47992706298828, 28.14317512512207, 29.806421279907227, 31.469667434692383, 33.13291549682617, 34.79616165161133, 36.459407806396484, 38.12265396118164, 39.7859001159668, 41.44914627075195, 43.112396240234375, 44.77564239501953, 46.43888854980469, 48.102134704589844, 49.765380859375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 0.0, 1.0, 5.0, 5.0, 6.0, 11.0, 7.0, 11.0, 11.0, 13.0, 13.0, 10.0, 22.0, 11.0, 24.0, 28.0, 23.0, 36.0, 29.0, 19.0, 38.0, 26.0, 33.0, 24.0, 40.0, 37.0, 56.0, 37.0, 21.0, 33.0, 43.0, 33.0, 37.0, 27.0, 28.0, 19.0, 34.0, 14.0, 19.0, 19.0, 12.0, 14.0, 10.0, 5.0, 11.0, 8.0, 7.0, 8.0, 7.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-3.16796875, -3.06878662109375, -2.9696044921875, -2.87042236328125, -2.771240234375, -2.67205810546875, -2.5728759765625, -2.47369384765625, -2.37451171875, -2.27532958984375, -2.1761474609375, -2.07696533203125, -1.977783203125, -1.87860107421875, -1.7794189453125, -1.68023681640625, -1.5810546875, -1.48187255859375, -1.3826904296875, -1.28350830078125, -1.184326171875, -1.08514404296875, -0.9859619140625, -0.88677978515625, -0.78759765625, -0.68841552734375, -0.5892333984375, -0.49005126953125, -0.390869140625, -0.29168701171875, -0.1925048828125, -0.09332275390625, 0.005859375, 0.10504150390625, 0.2042236328125, 0.30340576171875, 0.402587890625, 0.50177001953125, 0.6009521484375, 0.70013427734375, 0.79931640625, 0.89849853515625, 0.9976806640625, 1.09686279296875, 1.196044921875, 1.29522705078125, 1.3944091796875, 1.49359130859375, 1.5927734375, 1.69195556640625, 1.7911376953125, 1.89031982421875, 1.989501953125, 2.08868408203125, 2.1878662109375, 2.28704833984375, 2.38623046875, 2.48541259765625, 2.5845947265625, 2.68377685546875, 2.782958984375, 2.88214111328125, 2.9813232421875, 3.08050537109375, 3.1796875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 8.0, 7.0, 11.0, 15.0, 15.0, 34.0, 43.0, 73.0, 89.0, 125.0, 150.0, 207.0, 329.0, 440.0, 585.0, 802.0, 1098.0, 1490.0, 2109.0, 2920.0, 4044.0, 5610.0, 7990.0, 11216.0, 16281.0, 24145.0, 36079.0, 56458.0, 94014.0, 201588.0, 269595.0, 114082.0, 66199.0, 41383.0, 27002.0, 18518.0, 12593.0, 8846.0, 6224.0, 4414.0, 3265.0, 2344.0, 1694.0, 1170.0, 886.0, 650.0, 498.0, 343.0, 249.0, 170.0, 143.0, 93.0, 75.0, 48.0, 30.0, 38.0, 12.0, 14.0, 7.0, 7.0, 2.0, 3.0], "bins": [-0.64453125, -0.6244888305664062, -0.6044464111328125, -0.5844039916992188, -0.564361572265625, -0.5443191528320312, -0.5242767333984375, -0.5042343139648438, -0.48419189453125, -0.46414947509765625, -0.4441070556640625, -0.42406463623046875, -0.404022216796875, -0.38397979736328125, -0.3639373779296875, -0.34389495849609375, -0.3238525390625, -0.30381011962890625, -0.2837677001953125, -0.26372528076171875, -0.243682861328125, -0.22364044189453125, -0.2035980224609375, -0.18355560302734375, -0.16351318359375, -0.14347076416015625, -0.1234283447265625, -0.10338592529296875, -0.083343505859375, -0.06330108642578125, -0.0432586669921875, -0.02321624755859375, -0.003173828125, 0.01686859130859375, 0.0369110107421875, 0.05695343017578125, 0.076995849609375, 0.09703826904296875, 0.1170806884765625, 0.13712310791015625, 0.15716552734375, 0.17720794677734375, 0.1972503662109375, 0.21729278564453125, 0.237335205078125, 0.25737762451171875, 0.2774200439453125, 0.29746246337890625, 0.3175048828125, 0.33754730224609375, 0.3575897216796875, 0.37763214111328125, 0.397674560546875, 0.41771697998046875, 0.4377593994140625, 0.45780181884765625, 0.47784423828125, 0.49788665771484375, 0.5179290771484375, 0.5379714965820312, 0.558013916015625, 0.5780563354492188, 0.5980987548828125, 0.6181411743164062, 0.63818359375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 0.0, 3.0, 1.0, 7.0, 5.0, 9.0, 12.0, 12.0, 11.0, 17.0, 20.0, 24.0, 19.0, 23.0, 26.0, 32.0, 40.0, 45.0, 33.0, 38.0, 38.0, 40.0, 62.0, 1061.0, 40.0, 39.0, 35.0, 37.0, 38.0, 36.0, 36.0, 22.0, 26.0, 27.0, 19.0, 15.0, 15.0, 13.0, 6.0, 12.0, 7.0, 8.0, 4.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.296875, -2.22100830078125, -2.1451416015625, -2.06927490234375, -1.993408203125, -1.91754150390625, -1.8416748046875, -1.76580810546875, -1.68994140625, -1.61407470703125, -1.5382080078125, -1.46234130859375, -1.386474609375, -1.31060791015625, -1.2347412109375, -1.15887451171875, -1.0830078125, -1.00714111328125, -0.9312744140625, -0.85540771484375, -0.779541015625, -0.70367431640625, -0.6278076171875, -0.55194091796875, -0.47607421875, -0.40020751953125, -0.3243408203125, -0.24847412109375, -0.172607421875, -0.09674072265625, -0.0208740234375, 0.05499267578125, 0.130859375, 0.20672607421875, 0.2825927734375, 0.35845947265625, 0.434326171875, 0.51019287109375, 0.5860595703125, 0.66192626953125, 0.73779296875, 0.81365966796875, 0.8895263671875, 0.96539306640625, 1.041259765625, 1.11712646484375, 1.1929931640625, 1.26885986328125, 1.3447265625, 1.42059326171875, 1.4964599609375, 1.57232666015625, 1.648193359375, 1.72406005859375, 1.7999267578125, 1.87579345703125, 1.95166015625, 2.02752685546875, 2.1033935546875, 2.17926025390625, 2.255126953125, 2.33099365234375, 2.4068603515625, 2.48272705078125, 2.55859375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 7.0, 8.0, 15.0, 16.0, 29.0, 36.0, 62.0, 132.0, 225.0, 360.0, 666.0, 1259.0, 2277.0, 4366.0, 8377.0, 16505.0, 33786.0, 74179.0, 193596.0, 1502302.0, 143125.0, 59484.0, 27699.0, 13689.0, 6914.0, 3639.0, 1920.0, 1051.0, 582.0, 330.0, 179.0, 108.0, 67.0, 48.0, 21.0, 23.0, 13.0, 6.0, 9.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.240234375, -1.20306396484375, -1.1658935546875, -1.12872314453125, -1.091552734375, -1.05438232421875, -1.0172119140625, -0.98004150390625, -0.94287109375, -0.90570068359375, -0.8685302734375, -0.83135986328125, -0.794189453125, -0.75701904296875, -0.7198486328125, -0.68267822265625, -0.6455078125, -0.60833740234375, -0.5711669921875, -0.53399658203125, -0.496826171875, -0.45965576171875, -0.4224853515625, -0.38531494140625, -0.34814453125, -0.31097412109375, -0.2738037109375, -0.23663330078125, -0.199462890625, -0.16229248046875, -0.1251220703125, -0.08795166015625, -0.05078125, -0.01361083984375, 0.0235595703125, 0.06072998046875, 0.097900390625, 0.13507080078125, 0.1722412109375, 0.20941162109375, 0.24658203125, 0.28375244140625, 0.3209228515625, 0.35809326171875, 0.395263671875, 0.43243408203125, 0.4696044921875, 0.50677490234375, 0.5439453125, 0.58111572265625, 0.6182861328125, 0.65545654296875, 0.692626953125, 0.72979736328125, 0.7669677734375, 0.80413818359375, 0.84130859375, 0.87847900390625, 0.9156494140625, 0.95281982421875, 0.989990234375, 1.02716064453125, 1.0643310546875, 1.10150146484375, 1.138671875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 0.0, 3.0, 1.0, 11.0, 5.0, 14.0, 14.0, 17.0, 19.0, 27.0, 25.0, 26.0, 23.0, 26.0, 36.0, 44.0, 58.0, 52.0, 73.0, 55.0, 56.0, 60.0, 51.0, 44.0, 41.0, 49.0, 34.0, 22.0, 18.0, 19.0, 19.0, 15.0, 9.0, 8.0, 10.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0005059242248535156, -0.0004907883703708649, -0.0004756525158882141, -0.00046051666140556335, -0.0004453808069229126, -0.00043024495244026184, -0.0004151090979576111, -0.00039997324347496033, -0.00038483738899230957, -0.0003697015345096588, -0.00035456568002700806, -0.0003394298255443573, -0.00032429397106170654, -0.0003091581165790558, -0.00029402226209640503, -0.00027888640761375427, -0.0002637505531311035, -0.00024861469864845276, -0.000233478844165802, -0.00021834298968315125, -0.0002032071352005005, -0.00018807128071784973, -0.00017293542623519897, -0.00015779957175254822, -0.00014266371726989746, -0.0001275278627872467, -0.00011239200830459595, -9.725615382194519e-05, -8.212029933929443e-05, -6.698444485664368e-05, -5.184859037399292e-05, -3.671273589134216e-05, -2.1576881408691406e-05, -6.441026926040649e-06, 8.694827556610107e-06, 2.3830682039260864e-05, 3.896653652191162e-05, 5.410239100456238e-05, 6.923824548721313e-05, 8.437409996986389e-05, 9.950995445251465e-05, 0.0001146458089351654, 0.00012978166341781616, 0.00014491751790046692, 0.00016005337238311768, 0.00017518922686576843, 0.0001903250813484192, 0.00020546093583106995, 0.0002205967903137207, 0.00023573264479637146, 0.0002508684992790222, 0.000266004353761673, 0.00028114020824432373, 0.0002962760627269745, 0.00031141191720962524, 0.000326547771692276, 0.00034168362617492676, 0.0003568194806575775, 0.00037195533514022827, 0.00038709118962287903, 0.0004022270441055298, 0.00041736289858818054, 0.0004324987530708313, 0.00044763460755348206, 0.0004627704620361328]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 4.0, 5.0, 10.0, 4.0, 15.0, 17.0, 23.0, 28.0, 43.0, 45.0, 69.0, 79.0, 94.0, 102.0, 155.0, 202.0, 264.0, 389.0, 544.0, 1502.0, 1031755.0, 10804.0, 673.0, 435.0, 307.0, 205.0, 184.0, 120.0, 83.0, 80.0, 62.0, 69.0, 42.0, 36.0, 29.0, 13.0, 13.0, 9.0, 6.0, 4.0, 3.0, 5.0, 3.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00835418701171875, -0.008081912994384766, -0.007809638977050781, -0.007537364959716797, -0.0072650909423828125, -0.006992816925048828, -0.006720542907714844, -0.006448268890380859, -0.006175994873046875, -0.005903720855712891, -0.005631446838378906, -0.005359172821044922, -0.0050868988037109375, -0.004814624786376953, -0.004542350769042969, -0.004270076751708984, -0.003997802734375, -0.0037255287170410156, -0.0034532546997070312, -0.003180980682373047, -0.0029087066650390625, -0.002636432647705078, -0.0023641586303710938, -0.0020918846130371094, -0.001819610595703125, -0.0015473365783691406, -0.0012750625610351562, -0.0010027885437011719, -0.0007305145263671875, -0.0004582405090332031, -0.00018596649169921875, 8.630752563476562e-05, 0.00035858154296875, 0.0006308555603027344, 0.0009031295776367188, 0.0011754035949707031, 0.0014476776123046875, 0.0017199516296386719, 0.0019922256469726562, 0.0022644996643066406, 0.002536773681640625, 0.0028090476989746094, 0.0030813217163085938, 0.003353595733642578, 0.0036258697509765625, 0.003898143768310547, 0.004170417785644531, 0.004442691802978516, 0.0047149658203125, 0.004987239837646484, 0.005259513854980469, 0.005531787872314453, 0.0058040618896484375, 0.006076335906982422, 0.006348609924316406, 0.006620883941650391, 0.006893157958984375, 0.007165431976318359, 0.007437705993652344, 0.007709980010986328, 0.007982254028320312, 0.008254528045654297, 0.008526802062988281, 0.008799076080322266, 0.00907135009765625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 22.0, 670.0, 316.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016195368953049183, -0.0015716691268607974, -0.0015238014748319983, -0.0014759337063878775, -0.0014280660543590784, -0.0013801982859149575, -0.0013323305174708366, -0.0012844628654420376, -0.0012365952134132385, -0.0011887274449691176, -0.0011408597929403186, -0.0010929920244961977, -0.0010451243724673986, -0.0009972566040232778, -0.0009493888937868178, -0.0009015211835503578, -0.0008536534151062369, -0.000805785704869777, -0.000757917994633317, -0.0007100502261891961, -0.000662182574160397, -0.0006143148057162762, -0.0005664470954798162, -0.0005185793852433562, -0.00047071167500689626, -0.0004228439647704363, -0.0003749762545339763, -0.0003271085151936859, -0.0002792408049572259, -0.00023137309472076595, -0.00018350535538047552, -0.00013563764514401555, -8.777005132287741e-05, -3.990233381045982e-05, 7.965383701957762e-06, 5.583310849033296e-05, 0.00010370081872679293, 0.0001515685289632529, 0.00019943626830354333, 0.0002473039785400033, 0.00029517168877646327, 0.00034303939901292324, 0.0003909071092493832, 0.00043877484858967364, 0.0004866425588261336, 0.0005345102399587631, 0.000582378008402884, 0.000630245718639344, 0.000678113428875804, 0.0007259811391122639, 0.0007738488493487239, 0.0008217166177928448, 0.0008695842698216438, 0.0009174520382657647, 0.0009653197485022247, 0.0010131874587386847, 0.0010610551107674837, 0.0011089228792116046, 0.0011567905312404037, 0.0012046582996845245, 0.0012525259517133236, 0.0013003937201574445, 0.0013482614886015654, 0.0013961291406303644, 0.0014439969090744853]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 7.0, 0.0, 2.0, 1.0, 8.0, 7.0, 6.0, 11.0, 10.0, 10.0, 7.0, 19.0, 13.0, 20.0, 23.0, 26.0, 25.0, 22.0, 26.0, 23.0, 48.0, 41.0, 37.0, 28.0, 37.0, 42.0, 48.0, 43.0, 38.0, 36.0, 26.0, 37.0, 23.0, 33.0, 21.0, 28.0, 22.0, 20.0, 20.0, 19.0, 14.0, 14.0, 19.0, 5.0, 8.0, 10.0, 6.0, 7.0, 6.0, 7.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00020951032638549805, -0.00020232144743204117, -0.0001951325684785843, -0.0001879436895251274, -0.00018075481057167053, -0.00017356593161821365, -0.00016637705266475677, -0.0001591881737112999, -0.00015199929475784302, -0.00014481041580438614, -0.00013762153685092926, -0.00013043265789747238, -0.0001232437789440155, -0.00011605489999055862, -0.00010886602103710175, -0.00010167714208364487, -9.448826313018799e-05, -8.729938417673111e-05, -8.011050522327423e-05, -7.292162626981735e-05, -6.573274731636047e-05, -5.8543868362903595e-05, -5.1354989409446716e-05, -4.416611045598984e-05, -3.697723150253296e-05, -2.978835254907608e-05, -2.25994735956192e-05, -1.5410594642162323e-05, -8.221715688705444e-06, -1.0328367352485657e-06, 6.156042218208313e-06, 1.3344921171665192e-05, 2.053380012512207e-05, 2.772267907857895e-05, 3.491155803203583e-05, 4.2100436985492706e-05, 4.9289315938949585e-05, 5.6478194892406464e-05, 6.366707384586334e-05, 7.085595279932022e-05, 7.80448317527771e-05, 8.523371070623398e-05, 9.242258965969086e-05, 9.961146861314774e-05, 0.00010680034756660461, 0.00011398922652006149, 0.00012117810547351837, 0.00012836698442697525, 0.00013555586338043213, 0.000142744742333889, 0.00014993362128734589, 0.00015712250024080276, 0.00016431137919425964, 0.00017150025814771652, 0.0001786891371011734, 0.00018587801605463028, 0.00019306689500808716, 0.00020025577396154404, 0.00020744465291500092, 0.0002146335318684578, 0.00022182241082191467, 0.00022901128977537155, 0.00023620016872882843, 0.0002433890476822853, 0.0002505779266357422]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 5.0, 3.0, 0.0, 1.0, 5.0, 5.0, 6.0, 11.0, 7.0, 11.0, 11.0, 13.0, 13.0, 10.0, 22.0, 11.0, 24.0, 28.0, 23.0, 36.0, 29.0, 19.0, 38.0, 26.0, 33.0, 24.0, 40.0, 38.0, 55.0, 37.0, 21.0, 33.0, 43.0, 33.0, 37.0, 27.0, 27.0, 20.0, 34.0, 14.0, 19.0, 19.0, 12.0, 14.0, 10.0, 5.0, 11.0, 8.0, 7.0, 8.0, 7.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-3.16796875, -3.06878662109375, -2.9696044921875, -2.87042236328125, -2.771240234375, -2.67205810546875, -2.5728759765625, -2.47369384765625, -2.37451171875, -2.27532958984375, -2.1761474609375, -2.07696533203125, -1.977783203125, -1.87860107421875, -1.7794189453125, -1.68023681640625, -1.5810546875, -1.48187255859375, -1.3826904296875, -1.28350830078125, -1.184326171875, -1.08514404296875, -0.9859619140625, -0.88677978515625, -0.78759765625, -0.68841552734375, -0.5892333984375, -0.49005126953125, -0.390869140625, -0.29168701171875, -0.1925048828125, -0.09332275390625, 0.005859375, 0.10504150390625, 0.2042236328125, 0.30340576171875, 0.402587890625, 0.50177001953125, 0.6009521484375, 0.70013427734375, 0.79931640625, 0.89849853515625, 0.9976806640625, 1.09686279296875, 1.196044921875, 1.29522705078125, 1.3944091796875, 1.49359130859375, 1.5927734375, 1.69195556640625, 1.7911376953125, 1.89031982421875, 1.989501953125, 2.08868408203125, 2.1878662109375, 2.28704833984375, 2.38623046875, 2.48541259765625, 2.5845947265625, 2.68377685546875, 2.782958984375, 2.88214111328125, 2.9813232421875, 3.08050537109375, 3.1796875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 8.0, 14.0, 11.0, 24.0, 26.0, 36.0, 56.0, 75.0, 71.0, 129.0, 181.0, 238.0, 343.0, 463.0, 670.0, 956.0, 1253.0, 1911.0, 2877.0, 4498.0, 7985.0, 19197.0, 156833.0, 785293.0, 37036.0, 11464.0, 5852.0, 3323.0, 2363.0, 1552.0, 1145.0, 698.0, 530.0, 410.0, 260.0, 210.0, 146.0, 111.0, 74.0, 66.0, 49.0, 39.0, 19.0, 12.0, 16.0, 8.0, 9.0, 3.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-22.546875, -21.824951171875, -21.10302734375, -20.381103515625, -19.6591796875, -18.937255859375, -18.21533203125, -17.493408203125, -16.771484375, -16.049560546875, -15.32763671875, -14.605712890625, -13.8837890625, -13.161865234375, -12.43994140625, -11.718017578125, -10.99609375, -10.274169921875, -9.55224609375, -8.830322265625, -8.1083984375, -7.386474609375, -6.66455078125, -5.942626953125, -5.220703125, -4.498779296875, -3.77685546875, -3.054931640625, -2.3330078125, -1.611083984375, -0.88916015625, -0.167236328125, 0.5546875, 1.276611328125, 1.99853515625, 2.720458984375, 3.4423828125, 4.164306640625, 4.88623046875, 5.608154296875, 6.330078125, 7.052001953125, 7.77392578125, 8.495849609375, 9.2177734375, 9.939697265625, 10.66162109375, 11.383544921875, 12.10546875, 12.827392578125, 13.54931640625, 14.271240234375, 14.9931640625, 15.715087890625, 16.43701171875, 17.158935546875, 17.880859375, 18.602783203125, 19.32470703125, 20.046630859375, 20.7685546875, 21.490478515625, 22.21240234375, 22.934326171875, 23.65625]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 9.0, 6.0, 7.0, 12.0, 19.0, 12.0, 15.0, 12.0, 34.0, 26.0, 32.0, 31.0, 32.0, 33.0, 30.0, 57.0, 41.0, 108.0, 385.0, 1518.0, 141.0, 76.0, 43.0, 42.0, 45.0, 27.0, 29.0, 29.0, 28.0, 24.0, 23.0, 14.0, 16.0, 19.0, 10.0, 5.0, 11.0, 10.0, 5.0, 6.0, 4.0, 3.0, 5.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.0859375, -9.7392578125, -9.392578125, -9.0458984375, -8.69921875, -8.3525390625, -8.005859375, -7.6591796875, -7.3125, -6.9658203125, -6.619140625, -6.2724609375, -5.92578125, -5.5791015625, -5.232421875, -4.8857421875, -4.5390625, -4.1923828125, -3.845703125, -3.4990234375, -3.15234375, -2.8056640625, -2.458984375, -2.1123046875, -1.765625, -1.4189453125, -1.072265625, -0.7255859375, -0.37890625, -0.0322265625, 0.314453125, 0.6611328125, 1.0078125, 1.3544921875, 1.701171875, 2.0478515625, 2.39453125, 2.7412109375, 3.087890625, 3.4345703125, 3.78125, 4.1279296875, 4.474609375, 4.8212890625, 5.16796875, 5.5146484375, 5.861328125, 6.2080078125, 6.5546875, 6.9013671875, 7.248046875, 7.5947265625, 7.94140625, 8.2880859375, 8.634765625, 8.9814453125, 9.328125, 9.6748046875, 10.021484375, 10.3681640625, 10.71484375, 11.0615234375, 11.408203125, 11.7548828125, 12.1015625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 9.0, 12.0, 4.0, 8.0, 10.0, 17.0, 11.0, 16.0, 20.0, 34.0, 27.0, 35.0, 31.0, 45.0, 44.0, 101.0, 190.0, 520.0, 3278.0, 3100577.0, 39019.0, 928.0, 267.0, 121.0, 61.0, 58.0, 42.0, 28.0, 25.0, 28.0, 24.0, 14.0, 16.0, 12.0, 17.0, 10.0, 10.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0], "bins": [-54.71875, -53.14208984375, -51.5654296875, -49.98876953125, -48.412109375, -46.83544921875, -45.2587890625, -43.68212890625, -42.10546875, -40.52880859375, -38.9521484375, -37.37548828125, -35.798828125, -34.22216796875, -32.6455078125, -31.06884765625, -29.4921875, -27.91552734375, -26.3388671875, -24.76220703125, -23.185546875, -21.60888671875, -20.0322265625, -18.45556640625, -16.87890625, -15.30224609375, -13.7255859375, -12.14892578125, -10.572265625, -8.99560546875, -7.4189453125, -5.84228515625, -4.265625, -2.68896484375, -1.1123046875, 0.46435546875, 2.041015625, 3.61767578125, 5.1943359375, 6.77099609375, 8.34765625, 9.92431640625, 11.5009765625, 13.07763671875, 14.654296875, 16.23095703125, 17.8076171875, 19.38427734375, 20.9609375, 22.53759765625, 24.1142578125, 25.69091796875, 27.267578125, 28.84423828125, 30.4208984375, 31.99755859375, 33.57421875, 35.15087890625, 36.7275390625, 38.30419921875, 39.880859375, 41.45751953125, 43.0341796875, 44.61083984375, 46.1875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [332.0, 687.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.07246208190918, -0.2906932830810547, 16.49107551574707, 33.27284240722656, 50.05461120605469, 66.83638000488281, 83.61814880371094, 100.39991760253906, 117.18168640136719, 133.9634552001953, 150.74522399902344, 167.52699279785156, 184.3087615966797, 201.0905303955078, 217.87229919433594, 234.65406799316406, 251.4358367919922, 268.21759033203125, 284.9993896484375, 301.7811279296875, 318.56292724609375, 335.34466552734375, 352.12646484375, 368.908203125, 385.69000244140625, 402.4717712402344, 419.2535400390625, 436.0353088378906, 452.81707763671875, 469.5988464355469, 486.380615234375, 503.1623840332031, 519.944091796875, 536.725830078125, 553.5076293945312, 570.2894287109375, 587.0711669921875, 603.8529052734375, 620.6347045898438, 637.41650390625, 654.1982421875, 670.97998046875, 687.7617797851562, 704.5435791015625, 721.3253173828125, 738.1070556640625, 754.8888549804688, 771.670654296875, 788.452392578125, 805.234130859375, 822.0159301757812, 838.7977294921875, 855.5794677734375, 872.3612060546875, 889.1430053710938, 905.9248046875, 922.70654296875, 939.48828125, 956.2700805664062, 973.0518798828125, 989.8336181640625, 1006.6153564453125, 1023.3971557617188, 1040.178955078125, 1056.960693359375]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 7.0, 3.0, 1.0, 7.0, 6.0, 7.0, 13.0, 11.0, 17.0, 25.0, 26.0, 29.0, 32.0, 33.0, 33.0, 35.0, 48.0, 37.0, 36.0, 46.0, 45.0, 49.0, 45.0, 54.0, 38.0, 39.0, 52.0, 37.0, 39.0, 23.0, 21.0, 19.0, 24.0, 19.0, 11.0, 14.0, 9.0, 3.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.91167449951172, -34.55258560180664, -33.19349670410156, -31.834407806396484, -30.475317001342773, -29.116228103637695, -27.757139205932617, -26.398048400878906, -25.038959503173828, -23.67987060546875, -22.320781707763672, -20.961692810058594, -19.602602005004883, -18.243513107299805, -16.884424209594727, -15.525334358215332, -14.16624641418457, -12.807157516479492, -11.448067665100098, -10.08897876739502, -8.729888916015625, -7.370800018310547, -6.011711120605469, -4.652621269226074, -3.293532371520996, -1.9344431161880493, -0.5753538608551025, 0.7837352752685547, 2.142824649810791, 3.5019140243530273, 4.8610029220581055, 6.2200927734375, 7.579181671142578, 8.938270568847656, 10.29736042022705, 11.656449317932129, 13.015539169311523, 14.374628067016602, 15.73371696472168, 17.09280776977539, 18.45189666748047, 19.810985565185547, 21.170074462890625, 22.529163360595703, 23.888254165649414, 25.247343063354492, 26.60643196105957, 27.96552276611328, 29.324609756469727, 30.683698654174805, 32.042789459228516, 33.401878356933594, 34.76096725463867, 36.12005615234375, 37.47914505004883, 38.838233947753906, 40.197322845458984, 41.55641174316406, 42.91550064086914, 44.27458953857422, 45.6336784362793, 46.992767333984375, 48.35186004638672, 49.7109489440918, 51.070037841796875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 8.0, 8.0, 13.0, 7.0, 8.0, 15.0, 11.0, 17.0, 20.0, 17.0, 24.0, 27.0, 21.0, 31.0, 25.0, 25.0, 32.0, 29.0, 45.0, 30.0, 38.0, 34.0, 41.0, 43.0, 41.0, 35.0, 40.0, 40.0, 28.0, 22.0, 23.0, 25.0, 21.0, 28.0, 22.0, 10.0, 13.0, 13.0, 9.0, 7.0, 8.0, 7.0, 9.0, 9.0, 6.0, 2.0, 3.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0], "bins": [-3.4140625, -3.306549072265625, -3.19903564453125, -3.091522216796875, -2.9840087890625, -2.876495361328125, -2.76898193359375, -2.661468505859375, -2.553955078125, -2.446441650390625, -2.33892822265625, -2.231414794921875, -2.1239013671875, -2.016387939453125, -1.90887451171875, -1.801361083984375, -1.69384765625, -1.586334228515625, -1.47882080078125, -1.371307373046875, -1.2637939453125, -1.156280517578125, -1.04876708984375, -0.941253662109375, -0.833740234375, -0.726226806640625, -0.61871337890625, -0.511199951171875, -0.4036865234375, -0.296173095703125, -0.18865966796875, -0.081146240234375, 0.0263671875, 0.133880615234375, 0.24139404296875, 0.348907470703125, 0.4564208984375, 0.563934326171875, 0.67144775390625, 0.778961181640625, 0.886474609375, 0.993988037109375, 1.10150146484375, 1.209014892578125, 1.3165283203125, 1.424041748046875, 1.53155517578125, 1.639068603515625, 1.74658203125, 1.854095458984375, 1.96160888671875, 2.069122314453125, 2.1766357421875, 2.284149169921875, 2.39166259765625, 2.499176025390625, 2.606689453125, 2.714202880859375, 2.82171630859375, 2.929229736328125, 3.0367431640625, 3.144256591796875, 3.25177001953125, 3.359283447265625, 3.466796875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 3.0, 5.0, 4.0, 3.0, 12.0, 16.0, 18.0, 22.0, 28.0, 48.0, 64.0, 92.0, 129.0, 196.0, 309.0, 520.0, 902.0, 1584.0, 3161.0, 6588.0, 16480.0, 56832.0, 964317.0, 2970973.0, 127628.0, 25295.0, 9750.0, 4382.0, 2188.0, 1105.0, 602.0, 324.0, 199.0, 152.0, 104.0, 81.0, 43.0, 31.0, 19.0, 13.0, 13.0, 9.0, 11.0, 11.0, 7.0, 4.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-22.625, -21.943603515625, -21.26220703125, -20.580810546875, -19.8994140625, -19.218017578125, -18.53662109375, -17.855224609375, -17.173828125, -16.492431640625, -15.81103515625, -15.129638671875, -14.4482421875, -13.766845703125, -13.08544921875, -12.404052734375, -11.72265625, -11.041259765625, -10.35986328125, -9.678466796875, -8.9970703125, -8.315673828125, -7.63427734375, -6.952880859375, -6.271484375, -5.590087890625, -4.90869140625, -4.227294921875, -3.5458984375, -2.864501953125, -2.18310546875, -1.501708984375, -0.8203125, -0.138916015625, 0.54248046875, 1.223876953125, 1.9052734375, 2.586669921875, 3.26806640625, 3.949462890625, 4.630859375, 5.312255859375, 5.99365234375, 6.675048828125, 7.3564453125, 8.037841796875, 8.71923828125, 9.400634765625, 10.08203125, 10.763427734375, 11.44482421875, 12.126220703125, 12.8076171875, 13.489013671875, 14.17041015625, 14.851806640625, 15.533203125, 16.214599609375, 16.89599609375, 17.577392578125, 18.2587890625, 18.940185546875, 19.62158203125, 20.302978515625, 20.984375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 4.0, 8.0, 8.0, 15.0, 29.0, 48.0, 104.0, 189.0, 366.0, 756.0, 942.0, 716.0, 378.0, 200.0, 128.0, 68.0, 48.0, 30.0, 28.0, 10.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-41.59375, -40.6142578125, -39.634765625, -38.6552734375, -37.67578125, -36.6962890625, -35.716796875, -34.7373046875, -33.7578125, -32.7783203125, -31.798828125, -30.8193359375, -29.83984375, -28.8603515625, -27.880859375, -26.9013671875, -25.921875, -24.9423828125, -23.962890625, -22.9833984375, -22.00390625, -21.0244140625, -20.044921875, -19.0654296875, -18.0859375, -17.1064453125, -16.126953125, -15.1474609375, -14.16796875, -13.1884765625, -12.208984375, -11.2294921875, -10.25, -9.2705078125, -8.291015625, -7.3115234375, -6.33203125, -5.3525390625, -4.373046875, -3.3935546875, -2.4140625, -1.4345703125, -0.455078125, 0.5244140625, 1.50390625, 2.4833984375, 3.462890625, 4.4423828125, 5.421875, 6.4013671875, 7.380859375, 8.3603515625, 9.33984375, 10.3193359375, 11.298828125, 12.2783203125, 13.2578125, 14.2373046875, 15.216796875, 16.1962890625, 17.17578125, 18.1552734375, 19.134765625, 20.1142578125, 21.09375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 9.0, 20.0, 28.0, 58.0, 75.0, 129.0, 246.0, 543.0, 5542.0, 4184190.0, 2697.0, 406.0, 164.0, 76.0, 39.0, 35.0, 10.0, 11.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.0625, -103.2451171875, -98.427734375, -93.6103515625, -88.79296875, -83.9755859375, -79.158203125, -74.3408203125, -69.5234375, -64.7060546875, -59.888671875, -55.0712890625, -50.25390625, -45.4365234375, -40.619140625, -35.8017578125, -30.984375, -26.1669921875, -21.349609375, -16.5322265625, -11.71484375, -6.8974609375, -2.080078125, 2.7373046875, 7.5546875, 12.3720703125, 17.189453125, 22.0068359375, 26.82421875, 31.6416015625, 36.458984375, 41.2763671875, 46.09375, 50.9111328125, 55.728515625, 60.5458984375, 65.36328125, 70.1806640625, 74.998046875, 79.8154296875, 84.6328125, 89.4501953125, 94.267578125, 99.0849609375, 103.90234375, 108.7197265625, 113.537109375, 118.3544921875, 123.171875, 127.9892578125, 132.806640625, 137.6240234375, 142.44140625, 147.2587890625, 152.076171875, 156.8935546875, 161.7109375, 166.5283203125, 171.345703125, 176.1630859375, 180.98046875, 185.7978515625, 190.615234375, 195.4326171875, 200.25]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 461.0, 550.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.27412033081055, -43.03511428833008, -28.796110153198242, -14.557106018066406, -0.3180999755859375, 13.920902252197266, 28.159908294677734, 42.3989143371582, 56.63792037963867, 70.87692260742188, 85.11592864990234, 99.35493469238281, 113.59394073486328, 127.83294677734375, 142.0719451904297, 156.3109588623047, 170.54995727539062, 184.78895568847656, 199.02796936035156, 213.2669677734375, 227.5059814453125, 241.74497985839844, 255.98397827148438, 270.2229919433594, 284.4620056152344, 298.7010192871094, 312.94000244140625, 327.17901611328125, 341.41802978515625, 355.65704345703125, 369.8960266113281, 384.1350402832031, 398.3740539550781, 412.6130676269531, 426.85205078125, 441.091064453125, 455.330078125, 469.569091796875, 483.8080749511719, 498.0470886230469, 512.2860717773438, 526.5250854492188, 540.7640991210938, 555.0031127929688, 569.2420654296875, 583.4810791015625, 597.7200927734375, 611.9591064453125, 626.1981201171875, 640.4371337890625, 654.6761474609375, 668.9151611328125, 683.1541137695312, 697.3931274414062, 711.6321411132812, 725.8711547851562, 740.1101684570312, 754.3491821289062, 768.5881958007812, 782.8272094726562, 797.066162109375, 811.30517578125, 825.544189453125, 839.783203125, 854.022216796875]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 7.0, 3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 13.0, 5.0, 14.0, 14.0, 9.0, 17.0, 19.0, 23.0, 19.0, 28.0, 25.0, 24.0, 26.0, 37.0, 36.0, 49.0, 39.0, 46.0, 34.0, 45.0, 41.0, 39.0, 37.0, 54.0, 36.0, 36.0, 25.0, 28.0, 34.0, 19.0, 19.0, 21.0, 15.0, 10.0, 11.0, 11.0, 5.0, 6.0, 8.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-81.18515014648438, -78.84532165527344, -76.50550079345703, -74.16567993164062, -71.82585144042969, -69.48602294921875, -67.14620208740234, -64.80638122558594, -62.466552734375, -60.12672805786133, -57.786903381347656, -55.447078704833984, -53.10725402832031, -50.76742935180664, -48.42760467529297, -46.0877799987793, -43.747955322265625, -41.40813064575195, -39.06830596923828, -36.72848129272461, -34.38865661621094, -32.048831939697266, -29.709007263183594, -27.369182586669922, -25.02935791015625, -22.689533233642578, -20.349708557128906, -18.009883880615234, -15.670059204101562, -13.33023452758789, -10.990409851074219, -8.650585174560547, -6.310760498046875, -3.970935821533203, -1.6311111450195312, 0.7087135314941406, 3.0485382080078125, 5.388362884521484, 7.728187561035156, 10.068012237548828, 12.4078369140625, 14.747661590576172, 17.087486267089844, 19.427310943603516, 21.767135620117188, 24.10696029663086, 26.44678497314453, 28.786609649658203, 31.126434326171875, 33.46625900268555, 35.80608367919922, 38.14590835571289, 40.48573303222656, 42.825557708740234, 45.165382385253906, 47.50520706176758, 49.84503173828125, 52.18485641479492, 54.524681091308594, 56.864505767822266, 59.20433044433594, 61.54415512084961, 63.88397979736328, 66.22380065917969, 68.56362915039062]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 6.0, 1.0, 4.0, 8.0, 11.0, 5.0, 12.0, 9.0, 8.0, 9.0, 12.0, 20.0, 16.0, 18.0, 26.0, 40.0, 24.0, 26.0, 35.0, 36.0, 43.0, 23.0, 38.0, 36.0, 35.0, 40.0, 41.0, 39.0, 27.0, 38.0, 37.0, 36.0, 29.0, 30.0, 20.0, 21.0, 20.0, 14.0, 14.0, 15.0, 13.0, 9.0, 10.0, 8.0, 12.0, 11.0, 6.0, 1.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.412109375, -3.3017578125, -3.19140625, -3.0810546875, -2.970703125, -2.8603515625, -2.75, -2.6396484375, -2.529296875, -2.4189453125, -2.30859375, -2.1982421875, -2.087890625, -1.9775390625, -1.8671875, -1.7568359375, -1.646484375, -1.5361328125, -1.42578125, -1.3154296875, -1.205078125, -1.0947265625, -0.984375, -0.8740234375, -0.763671875, -0.6533203125, -0.54296875, -0.4326171875, -0.322265625, -0.2119140625, -0.1015625, 0.0087890625, 0.119140625, 0.2294921875, 0.33984375, 0.4501953125, 0.560546875, 0.6708984375, 0.78125, 0.8916015625, 1.001953125, 1.1123046875, 1.22265625, 1.3330078125, 1.443359375, 1.5537109375, 1.6640625, 1.7744140625, 1.884765625, 1.9951171875, 2.10546875, 2.2158203125, 2.326171875, 2.4365234375, 2.546875, 2.6572265625, 2.767578125, 2.8779296875, 2.98828125, 3.0986328125, 3.208984375, 3.3193359375, 3.4296875, 3.5400390625, 3.650390625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 10.0, 8.0, 9.0, 13.0, 14.0, 27.0, 41.0, 50.0, 93.0, 102.0, 167.0, 267.0, 380.0, 575.0, 852.0, 1308.0, 2099.0, 3047.0, 4607.0, 7317.0, 11426.0, 18939.0, 31733.0, 56518.0, 111056.0, 290531.0, 267986.0, 105284.0, 54012.0, 30407.0, 18185.0, 11078.0, 7110.0, 4444.0, 2996.0, 2052.0, 1265.0, 853.0, 560.0, 371.0, 249.0, 163.0, 98.0, 77.0, 61.0, 34.0, 26.0, 19.0, 3.0, 10.0, 13.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0], "bins": [-0.94384765625, -0.9152145385742188, -0.8865814208984375, -0.8579483032226562, -0.829315185546875, -0.8006820678710938, -0.7720489501953125, -0.7434158325195312, -0.71478271484375, -0.6861495971679688, -0.6575164794921875, -0.6288833618164062, -0.600250244140625, -0.5716171264648438, -0.5429840087890625, -0.5143508911132812, -0.4857177734375, -0.45708465576171875, -0.4284515380859375, -0.39981842041015625, -0.371185302734375, -0.34255218505859375, -0.3139190673828125, -0.28528594970703125, -0.25665283203125, -0.22801971435546875, -0.1993865966796875, -0.17075347900390625, -0.142120361328125, -0.11348724365234375, -0.0848541259765625, -0.05622100830078125, -0.027587890625, 0.00104522705078125, 0.0296783447265625, 0.05831146240234375, 0.086944580078125, 0.11557769775390625, 0.1442108154296875, 0.17284393310546875, 0.20147705078125, 0.23011016845703125, 0.2587432861328125, 0.28737640380859375, 0.316009521484375, 0.34464263916015625, 0.3732757568359375, 0.40190887451171875, 0.4305419921875, 0.45917510986328125, 0.4878082275390625, 0.5164413452148438, 0.545074462890625, 0.5737075805664062, 0.6023406982421875, 0.6309738159179688, 0.65960693359375, 0.6882400512695312, 0.7168731689453125, 0.7455062866210938, 0.774139404296875, 0.8027725219726562, 0.8314056396484375, 0.8600387573242188, 0.888671875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 3.0, 6.0, 9.0, 5.0, 13.0, 13.0, 8.0, 9.0, 17.0, 19.0, 22.0, 24.0, 28.0, 36.0, 32.0, 28.0, 33.0, 36.0, 25.0, 44.0, 35.0, 1069.0, 46.0, 45.0, 49.0, 39.0, 39.0, 44.0, 32.0, 21.0, 23.0, 25.0, 21.0, 31.0, 17.0, 16.0, 26.0, 12.0, 5.0, 5.0, 5.0, 2.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-2.62109375, -2.540863037109375, -2.46063232421875, -2.380401611328125, -2.3001708984375, -2.219940185546875, -2.13970947265625, -2.059478759765625, -1.979248046875, -1.899017333984375, -1.81878662109375, -1.738555908203125, -1.6583251953125, -1.578094482421875, -1.49786376953125, -1.417633056640625, -1.33740234375, -1.257171630859375, -1.17694091796875, -1.096710205078125, -1.0164794921875, -0.936248779296875, -0.85601806640625, -0.775787353515625, -0.695556640625, -0.615325927734375, -0.53509521484375, -0.454864501953125, -0.3746337890625, -0.294403076171875, -0.21417236328125, -0.133941650390625, -0.0537109375, 0.026519775390625, 0.10675048828125, 0.186981201171875, 0.2672119140625, 0.347442626953125, 0.42767333984375, 0.507904052734375, 0.588134765625, 0.668365478515625, 0.74859619140625, 0.828826904296875, 0.9090576171875, 0.989288330078125, 1.06951904296875, 1.149749755859375, 1.22998046875, 1.310211181640625, 1.39044189453125, 1.470672607421875, 1.5509033203125, 1.631134033203125, 1.71136474609375, 1.791595458984375, 1.871826171875, 1.952056884765625, 2.03228759765625, 2.112518310546875, 2.1927490234375, 2.272979736328125, 2.35321044921875, 2.433441162109375, 2.513671875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 1.0, 4.0, 6.0, 6.0, 8.0, 17.0, 41.0, 52.0, 81.0, 137.0, 212.0, 392.0, 583.0, 1183.0, 2209.0, 4055.0, 8042.0, 15901.0, 32358.0, 68350.0, 169033.0, 1503682.0, 161370.0, 65647.0, 31735.0, 15302.0, 7818.0, 4132.0, 2124.0, 1081.0, 651.0, 362.0, 208.0, 129.0, 82.0, 41.0, 29.0, 15.0, 15.0, 12.0, 5.0, 8.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2373046875, -1.197998046875, -1.15869140625, -1.119384765625, -1.080078125, -1.040771484375, -1.00146484375, -0.962158203125, -0.9228515625, -0.883544921875, -0.84423828125, -0.804931640625, -0.765625, -0.726318359375, -0.68701171875, -0.647705078125, -0.6083984375, -0.569091796875, -0.52978515625, -0.490478515625, -0.451171875, -0.411865234375, -0.37255859375, -0.333251953125, -0.2939453125, -0.254638671875, -0.21533203125, -0.176025390625, -0.13671875, -0.097412109375, -0.05810546875, -0.018798828125, 0.0205078125, 0.059814453125, 0.09912109375, 0.138427734375, 0.177734375, 0.217041015625, 0.25634765625, 0.295654296875, 0.3349609375, 0.374267578125, 0.41357421875, 0.452880859375, 0.4921875, 0.531494140625, 0.57080078125, 0.610107421875, 0.6494140625, 0.688720703125, 0.72802734375, 0.767333984375, 0.806640625, 0.845947265625, 0.88525390625, 0.924560546875, 0.9638671875, 1.003173828125, 1.04248046875, 1.081787109375, 1.12109375, 1.160400390625, 1.19970703125, 1.239013671875, 1.2783203125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 1.0, 7.0, 6.0, 13.0, 5.0, 11.0, 12.0, 26.0, 24.0, 40.0, 37.0, 34.0, 26.0, 45.0, 54.0, 58.0, 64.0, 53.0, 68.0, 58.0, 48.0, 57.0, 46.0, 48.0, 40.0, 19.0, 25.0, 12.0, 20.0, 10.0, 3.0, 5.0, 3.0, 3.0, 4.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005168914794921875, -0.0005007311701774597, -0.00048457086086273193, -0.00046841055154800415, -0.00045225024223327637, -0.0004360899329185486, -0.0004199296236038208, -0.000403769314289093, -0.00038760900497436523, -0.00037144869565963745, -0.00035528838634490967, -0.0003391280770301819, -0.0003229677677154541, -0.0003068074584007263, -0.00029064714908599854, -0.00027448683977127075, -0.00025832653045654297, -0.00024216622114181519, -0.0002260059118270874, -0.00020984560251235962, -0.00019368529319763184, -0.00017752498388290405, -0.00016136467456817627, -0.00014520436525344849, -0.0001290440559387207, -0.00011288374662399292, -9.672343730926514e-05, -8.056312799453735e-05, -6.440281867980957e-05, -4.824250936508179e-05, -3.2082200050354004e-05, -1.592189073562622e-05, 2.384185791015625e-07, 1.6398727893829346e-05, 3.255903720855713e-05, 4.871934652328491e-05, 6.48796558380127e-05, 8.103996515274048e-05, 9.720027446746826e-05, 0.00011336058378219604, 0.00012952089309692383, 0.0001456812024116516, 0.0001618415117263794, 0.00017800182104110718, 0.00019416213035583496, 0.00021032243967056274, 0.00022648274898529053, 0.0002426430583000183, 0.0002588033676147461, 0.0002749636769294739, 0.00029112398624420166, 0.00030728429555892944, 0.0003234446048736572, 0.000339604914188385, 0.0003557652235031128, 0.0003719255328178406, 0.00038808584213256836, 0.00040424615144729614, 0.0004204064607620239, 0.0004365667700767517, 0.0004527270793914795, 0.0004688873887062073, 0.00048504769802093506, 0.0005012080073356628, 0.0005173683166503906]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 4.0, 0.0, 2.0, 4.0, 7.0, 2.0, 7.0, 5.0, 7.0, 13.0, 23.0, 29.0, 38.0, 34.0, 53.0, 62.0, 114.0, 175.0, 239.0, 472.0, 1336.0, 1039084.0, 5363.0, 586.0, 298.0, 166.0, 114.0, 67.0, 65.0, 45.0, 32.0, 24.0, 19.0, 10.0, 14.0, 10.0, 4.0, 2.0, 9.0, 6.0, 5.0, 0.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.013092041015625, -0.012691020965576172, -0.012290000915527344, -0.011888980865478516, -0.011487960815429688, -0.01108694076538086, -0.010685920715332031, -0.010284900665283203, -0.009883880615234375, -0.009482860565185547, -0.009081840515136719, -0.00868082046508789, -0.008279800415039062, -0.007878780364990234, -0.007477760314941406, -0.007076740264892578, -0.00667572021484375, -0.006274700164794922, -0.005873680114746094, -0.005472660064697266, -0.0050716400146484375, -0.004670619964599609, -0.004269599914550781, -0.003868579864501953, -0.003467559814453125, -0.003066539764404297, -0.0026655197143554688, -0.0022644996643066406, -0.0018634796142578125, -0.0014624595642089844, -0.0010614395141601562, -0.0006604194641113281, -0.0002593994140625, 0.00014162063598632812, 0.0005426406860351562, 0.0009436607360839844, 0.0013446807861328125, 0.0017457008361816406, 0.0021467208862304688, 0.002547740936279297, 0.002948760986328125, 0.003349781036376953, 0.0037508010864257812, 0.004151821136474609, 0.0045528411865234375, 0.004953861236572266, 0.005354881286621094, 0.005755901336669922, 0.00615692138671875, 0.006557941436767578, 0.006958961486816406, 0.007359981536865234, 0.0077610015869140625, 0.00816202163696289, 0.008563041687011719, 0.008964061737060547, 0.009365081787109375, 0.009766101837158203, 0.010167121887207031, 0.01056814193725586, 0.010969161987304688, 0.011370182037353516, 0.011771202087402344, 0.012172222137451172, 0.0125732421875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 51.0, 293.0, 521.0, 139.0, 9.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016973786987364292, -0.0016648794990032911, -0.001632380299270153, -0.001599881099537015, -0.0015673818998038769, -0.0015348827000707388, -0.0015023835003376007, -0.0014698843006044626, -0.0014373851008713245, -0.0014048859011381865, -0.0013723867014050484, -0.0013398875016719103, -0.0013073883019387722, -0.0012748891022056341, -0.001242389902472496, -0.001209890702739358, -0.0011773915030062199, -0.0011448923032730818, -0.0011123931035399437, -0.0010798939038068056, -0.0010473947040736675, -0.0010148955043405294, -0.0009823963046073914, -0.0009498971048742533, -0.0009173977887257934, -0.0008848985889926553, -0.0008523993892595172, -0.0008199001895263791, -0.000787400989793241, -0.0007549017900601029, -0.0007224025903269649, -0.0006899033905938268, -0.0006574042490683496, -0.0006249050493352115, -0.0005924058496020734, -0.0005599066498689353, -0.0005274074501357973, -0.0004949082504026592, -0.00046240902156569064, -0.00042990982183255255, -0.00039741062209941447, -0.0003649114223662764, -0.0003324122226331383, -0.00029991299379616976, -0.0002674137940630317, -0.00023491460888180882, -0.0002024153945967555, -0.00016991619486361742, -0.00013741699513047934, -0.00010491779539734125, -7.241858838824555e-05, -3.9919381379149854e-05, -7.42018164601177e-06, 2.5079018087126315e-05, 5.757823237217963e-05, 9.007743210531771e-05, 0.0001225766318384558, 0.00015507583157159388, 0.00018757503130473197, 0.00022007424558978528, 0.0002525734598748386, 0.0002850726596079767, 0.00031757185934111476, 0.00035007105907425284, 0.00038257025880739093]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 4.0, 10.0, 6.0, 4.0, 12.0, 9.0, 11.0, 14.0, 14.0, 32.0, 19.0, 25.0, 16.0, 35.0, 32.0, 31.0, 35.0, 38.0, 44.0, 43.0, 39.0, 40.0, 36.0, 38.0, 48.0, 42.0, 35.0, 24.0, 30.0, 32.0, 34.0, 25.0, 19.0, 15.0, 18.0, 18.0, 11.0, 17.0, 7.0, 5.0, 8.0, 6.0, 3.0, 6.0, 4.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-0.00025659799575805664, -0.0002488205209374428, -0.00024104304611682892, -0.00023326557129621506, -0.0002254880964756012, -0.00021771062165498734, -0.00020993314683437347, -0.0002021556720137596, -0.00019437819719314575, -0.0001866007223725319, -0.00017882324755191803, -0.00017104577273130417, -0.0001632682979106903, -0.00015549082309007645, -0.00014771334826946259, -0.00013993587344884872, -0.00013215839862823486, -0.000124380923807621, -0.00011660344898700714, -0.00010882597416639328, -0.00010104849934577942, -9.327102452516556e-05, -8.54935497045517e-05, -7.771607488393784e-05, -6.993860006332397e-05, -6.216112524271011e-05, -5.438365042209625e-05, -4.660617560148239e-05, -3.882870078086853e-05, -3.105122596025467e-05, -2.3273751139640808e-05, -1.5496276319026947e-05, -7.718801498413086e-06, 5.8673322200775146e-08, 7.836148142814636e-06, 1.5613622963428497e-05, 2.339109778404236e-05, 3.116857260465622e-05, 3.894604742527008e-05, 4.672352224588394e-05, 5.45009970664978e-05, 6.227847188711166e-05, 7.005594670772552e-05, 7.783342152833939e-05, 8.561089634895325e-05, 9.338837116956711e-05, 0.00010116584599018097, 0.00010894332081079483, 0.00011672079563140869, 0.00012449827045202255, 0.00013227574527263641, 0.00014005322009325027, 0.00014783069491386414, 0.000155608169734478, 0.00016338564455509186, 0.00017116311937570572, 0.00017894059419631958, 0.00018671806901693344, 0.0001944955438375473, 0.00020227301865816116, 0.00021005049347877502, 0.00021782796829938889, 0.00022560544312000275, 0.0002333829179406166, 0.00024116039276123047]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 6.0, 1.0, 4.0, 8.0, 11.0, 5.0, 12.0, 9.0, 8.0, 9.0, 12.0, 20.0, 16.0, 18.0, 26.0, 40.0, 24.0, 26.0, 35.0, 36.0, 43.0, 23.0, 38.0, 36.0, 35.0, 40.0, 41.0, 39.0, 27.0, 38.0, 37.0, 36.0, 29.0, 30.0, 20.0, 21.0, 20.0, 14.0, 14.0, 15.0, 13.0, 9.0, 10.0, 8.0, 12.0, 11.0, 6.0, 1.0, 5.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-3.412109375, -3.3017578125, -3.19140625, -3.0810546875, -2.970703125, -2.8603515625, -2.75, -2.6396484375, -2.529296875, -2.4189453125, -2.30859375, -2.1982421875, -2.087890625, -1.9775390625, -1.8671875, -1.7568359375, -1.646484375, -1.5361328125, -1.42578125, -1.3154296875, -1.205078125, -1.0947265625, -0.984375, -0.8740234375, -0.763671875, -0.6533203125, -0.54296875, -0.4326171875, -0.322265625, -0.2119140625, -0.1015625, 0.0087890625, 0.119140625, 0.2294921875, 0.33984375, 0.4501953125, 0.560546875, 0.6708984375, 0.78125, 0.8916015625, 1.001953125, 1.1123046875, 1.22265625, 1.3330078125, 1.443359375, 1.5537109375, 1.6640625, 1.7744140625, 1.884765625, 1.9951171875, 2.10546875, 2.2158203125, 2.326171875, 2.4365234375, 2.546875, 2.6572265625, 2.767578125, 2.8779296875, 2.98828125, 3.0986328125, 3.208984375, 3.3193359375, 3.4296875, 3.5400390625, 3.650390625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [5.0, 0.0, 3.0, 5.0, 4.0, 7.0, 5.0, 5.0, 18.0, 16.0, 19.0, 31.0, 37.0, 41.0, 56.0, 73.0, 100.0, 135.0, 172.0, 249.0, 382.0, 545.0, 916.0, 1488.0, 2848.0, 6023.0, 13934.0, 35100.0, 99543.0, 313955.0, 377556.0, 122016.0, 41963.0, 16336.0, 7042.0, 3328.0, 1660.0, 924.0, 600.0, 380.0, 266.0, 207.0, 129.0, 95.0, 89.0, 60.0, 43.0, 39.0, 31.0, 28.0, 13.0, 18.0, 5.0, 3.0, 10.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.232421875, -3.125, -3.017578125, -2.91015625, -2.802734375, -2.6953125, -2.587890625, -2.48046875, -2.373046875, -2.265625, -2.158203125, -2.05078125, -1.943359375, -1.8359375, -1.728515625, -1.62109375, -1.513671875, -1.40625, -1.298828125, -1.19140625, -1.083984375, -0.9765625, -0.869140625, -0.76171875, -0.654296875, -0.546875, -0.439453125, -0.33203125, -0.224609375, -0.1171875, -0.009765625, 0.09765625, 0.205078125, 0.3125, 0.419921875, 0.52734375, 0.634765625, 0.7421875, 0.849609375, 0.95703125, 1.064453125, 1.171875, 1.279296875, 1.38671875, 1.494140625, 1.6015625, 1.708984375, 1.81640625, 1.923828125, 2.03125, 2.138671875, 2.24609375, 2.353515625, 2.4609375, 2.568359375, 2.67578125, 2.783203125, 2.890625, 2.998046875, 3.10546875, 3.212890625, 3.3203125, 3.427734375, 3.53515625, 3.642578125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 4.0, 1.0, 2.0, 4.0, 3.0, 6.0, 8.0, 10.0, 8.0, 11.0, 8.0, 17.0, 13.0, 22.0, 18.0, 26.0, 25.0, 31.0, 36.0, 32.0, 39.0, 49.0, 44.0, 79.0, 191.0, 1685.0, 194.0, 79.0, 49.0, 49.0, 34.0, 44.0, 22.0, 31.0, 27.0, 29.0, 19.0, 19.0, 11.0, 15.0, 13.0, 9.0, 9.0, 10.0, 8.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.0234375, -11.586181640625, -11.14892578125, -10.711669921875, -10.2744140625, -9.837158203125, -9.39990234375, -8.962646484375, -8.525390625, -8.088134765625, -7.65087890625, -7.213623046875, -6.7763671875, -6.339111328125, -5.90185546875, -5.464599609375, -5.02734375, -4.590087890625, -4.15283203125, -3.715576171875, -3.2783203125, -2.841064453125, -2.40380859375, -1.966552734375, -1.529296875, -1.092041015625, -0.65478515625, -0.217529296875, 0.2197265625, 0.656982421875, 1.09423828125, 1.531494140625, 1.96875, 2.406005859375, 2.84326171875, 3.280517578125, 3.7177734375, 4.155029296875, 4.59228515625, 5.029541015625, 5.466796875, 5.904052734375, 6.34130859375, 6.778564453125, 7.2158203125, 7.653076171875, 8.09033203125, 8.527587890625, 8.96484375, 9.402099609375, 9.83935546875, 10.276611328125, 10.7138671875, 11.151123046875, 11.58837890625, 12.025634765625, 12.462890625, 12.900146484375, 13.33740234375, 13.774658203125, 14.2119140625, 14.649169921875, 15.08642578125, 15.523681640625, 15.9609375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 6.0, 5.0, 9.0, 13.0, 7.0, 14.0, 12.0, 14.0, 17.0, 19.0, 31.0, 26.0, 24.0, 53.0, 63.0, 81.0, 132.0, 265.0, 638.0, 2825.0, 2660308.0, 477798.0, 2059.0, 539.0, 228.0, 140.0, 72.0, 44.0, 61.0, 35.0, 30.0, 18.0, 22.0, 16.0, 17.0, 12.0, 11.0, 9.0, 9.0, 3.0, 9.0, 4.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0], "bins": [-37.46875, -36.4541015625, -35.439453125, -34.4248046875, -33.41015625, -32.3955078125, -31.380859375, -30.3662109375, -29.3515625, -28.3369140625, -27.322265625, -26.3076171875, -25.29296875, -24.2783203125, -23.263671875, -22.2490234375, -21.234375, -20.2197265625, -19.205078125, -18.1904296875, -17.17578125, -16.1611328125, -15.146484375, -14.1318359375, -13.1171875, -12.1025390625, -11.087890625, -10.0732421875, -9.05859375, -8.0439453125, -7.029296875, -6.0146484375, -5.0, -3.9853515625, -2.970703125, -1.9560546875, -0.94140625, 0.0732421875, 1.087890625, 2.1025390625, 3.1171875, 4.1318359375, 5.146484375, 6.1611328125, 7.17578125, 8.1904296875, 9.205078125, 10.2197265625, 11.234375, 12.2490234375, 13.263671875, 14.2783203125, 15.29296875, 16.3076171875, 17.322265625, 18.3369140625, 19.3515625, 20.3662109375, 21.380859375, 22.3955078125, 23.41015625, 24.4248046875, 25.439453125, 26.4541015625, 27.46875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 273.0, 730.0, 12.0, 1.0], "bins": [-210.92942810058594, -207.4821014404297, -204.03475952148438, -200.58743286132812, -197.14010620117188, -193.69277954101562, -190.2454376220703, -186.79811096191406, -183.3507843017578, -179.90345764160156, -176.45611572265625, -173.0087890625, -169.56146240234375, -166.1141357421875, -162.6667938232422, -159.21946716308594, -155.77212524414062, -152.32479858398438, -148.87745666503906, -145.4301300048828, -141.98280334472656, -138.5354766845703, -135.088134765625, -131.64080810546875, -128.1934814453125, -124.74614715576172, -121.29882049560547, -117.85148620605469, -114.40415954589844, -110.95682525634766, -107.50949096679688, -104.06216430664062, -100.6148452758789, -97.16751098632812, -93.72018432617188, -90.2728500366211, -86.82552337646484, -83.37818908691406, -79.93086242675781, -76.48352813720703, -73.03619384765625, -69.58885955810547, -66.14153289794922, -62.69419860839844, -59.24687194824219, -55.799537658691406, -52.35220718383789, -48.904876708984375, -45.45754623413086, -42.010215759277344, -38.56288528442383, -35.11555480957031, -31.668222427368164, -28.22089195251465, -24.7735595703125, -21.326229095458984, -17.87889862060547, -14.431568145751953, -10.984236717224121, -7.536905288696289, -4.089574813842773, -0.6422443389892578, 2.8050880432128906, 6.252418518066406, 9.699748039245605]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 2.0, 7.0, 5.0, 7.0, 9.0, 9.0, 11.0, 15.0, 16.0, 20.0, 19.0, 29.0, 29.0, 33.0, 34.0, 27.0, 35.0, 45.0, 37.0, 33.0, 35.0, 33.0, 44.0, 39.0, 39.0, 30.0, 30.0, 43.0, 38.0, 33.0, 21.0, 23.0, 21.0, 25.0, 19.0, 18.0, 17.0, 16.0, 16.0, 6.0, 8.0, 7.0, 3.0, 7.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.838592529296875, -38.5027961730957, -37.16699981689453, -35.831207275390625, -34.49541091918945, -33.15961456298828, -31.82381820678711, -30.488021850585938, -29.1522274017334, -27.816431045532227, -26.480636596679688, -25.144840240478516, -23.809043884277344, -22.473249435424805, -21.137453079223633, -19.801658630371094, -18.465862274169922, -17.13006591796875, -15.794271469116211, -14.458475112915039, -13.122679710388184, -11.786884307861328, -10.451087951660156, -9.1152925491333, -7.779497146606445, -6.44370174407959, -5.107905864715576, -3.7721099853515625, -2.436314582824707, -1.1005191802978516, 0.2352771759033203, 1.5710725784301758, 2.9068679809570312, 4.242663383483887, 5.5784592628479, 6.914255142211914, 8.25005054473877, 9.585845947265625, 10.921642303466797, 12.257437705993652, 13.593233108520508, 14.929028511047363, 16.26482391357422, 17.60062026977539, 18.936416625976562, 20.2722110748291, 21.608007431030273, 22.943801879882812, 24.279598236083984, 25.615394592285156, 26.951189041137695, 28.286985397338867, 29.622779846191406, 30.958576202392578, 32.29437255859375, 33.63016891479492, 34.965965270996094, 36.301761627197266, 37.63755798339844, 38.973350524902344, 40.309146881103516, 41.64494323730469, 42.98073959350586, 44.31653594970703, 45.65232849121094]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 0.0, 4.0, 5.0, 2.0, 8.0, 11.0, 11.0, 5.0, 7.0, 15.0, 7.0, 11.0, 16.0, 23.0, 24.0, 30.0, 29.0, 36.0, 29.0, 30.0, 35.0, 41.0, 38.0, 36.0, 36.0, 29.0, 45.0, 44.0, 36.0, 34.0, 33.0, 34.0, 36.0, 32.0, 18.0, 24.0, 23.0, 14.0, 18.0, 13.0, 11.0, 11.0, 8.0, 12.0, 8.0, 10.0, 10.0, 6.0, 1.0, 1.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.765625, -3.64947509765625, -3.5333251953125, -3.41717529296875, -3.301025390625, -3.18487548828125, -3.0687255859375, -2.95257568359375, -2.83642578125, -2.72027587890625, -2.6041259765625, -2.48797607421875, -2.371826171875, -2.25567626953125, -2.1395263671875, -2.02337646484375, -1.9072265625, -1.79107666015625, -1.6749267578125, -1.55877685546875, -1.442626953125, -1.32647705078125, -1.2103271484375, -1.09417724609375, -0.97802734375, -0.86187744140625, -0.7457275390625, -0.62957763671875, -0.513427734375, -0.39727783203125, -0.2811279296875, -0.16497802734375, -0.048828125, 0.06732177734375, 0.1834716796875, 0.29962158203125, 0.415771484375, 0.53192138671875, 0.6480712890625, 0.76422119140625, 0.88037109375, 0.99652099609375, 1.1126708984375, 1.22882080078125, 1.344970703125, 1.46112060546875, 1.5772705078125, 1.69342041015625, 1.8095703125, 1.92572021484375, 2.0418701171875, 2.15802001953125, 2.274169921875, 2.39031982421875, 2.5064697265625, 2.62261962890625, 2.73876953125, 2.85491943359375, 2.9710693359375, 3.08721923828125, 3.203369140625, 3.31951904296875, 3.4356689453125, 3.55181884765625, 3.66796875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 8.0, 5.0, 19.0, 13.0, 17.0, 28.0, 21.0, 31.0, 34.0, 64.0, 80.0, 116.0, 194.0, 381.0, 1227.0, 7730.0, 134254.0, 3103720.0, 916344.0, 25902.0, 2645.0, 622.0, 281.0, 151.0, 83.0, 77.0, 41.0, 43.0, 25.0, 29.0, 19.0, 11.0, 11.0, 11.0, 7.0, 5.0, 11.0, 5.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.65625, -16.114501953125, -15.57275390625, -15.031005859375, -14.4892578125, -13.947509765625, -13.40576171875, -12.864013671875, -12.322265625, -11.780517578125, -11.23876953125, -10.697021484375, -10.1552734375, -9.613525390625, -9.07177734375, -8.530029296875, -7.98828125, -7.446533203125, -6.90478515625, -6.363037109375, -5.8212890625, -5.279541015625, -4.73779296875, -4.196044921875, -3.654296875, -3.112548828125, -2.57080078125, -2.029052734375, -1.4873046875, -0.945556640625, -0.40380859375, 0.137939453125, 0.6796875, 1.221435546875, 1.76318359375, 2.304931640625, 2.8466796875, 3.388427734375, 3.93017578125, 4.471923828125, 5.013671875, 5.555419921875, 6.09716796875, 6.638916015625, 7.1806640625, 7.722412109375, 8.26416015625, 8.805908203125, 9.34765625, 9.889404296875, 10.43115234375, 10.972900390625, 11.5146484375, 12.056396484375, 12.59814453125, 13.139892578125, 13.681640625, 14.223388671875, 14.76513671875, 15.306884765625, 15.8486328125, 16.390380859375, 16.93212890625, 17.473876953125, 18.015625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 7.0, 15.0, 29.0, 41.0, 44.0, 73.0, 117.0, 181.0, 266.0, 442.0, 539.0, 640.0, 494.0, 379.0, 262.0, 188.0, 120.0, 77.0, 52.0, 33.0, 14.0, 16.0, 16.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.546875, -19.9658203125, -19.384765625, -18.8037109375, -18.22265625, -17.6416015625, -17.060546875, -16.4794921875, -15.8984375, -15.3173828125, -14.736328125, -14.1552734375, -13.57421875, -12.9931640625, -12.412109375, -11.8310546875, -11.25, -10.6689453125, -10.087890625, -9.5068359375, -8.92578125, -8.3447265625, -7.763671875, -7.1826171875, -6.6015625, -6.0205078125, -5.439453125, -4.8583984375, -4.27734375, -3.6962890625, -3.115234375, -2.5341796875, -1.953125, -1.3720703125, -0.791015625, -0.2099609375, 0.37109375, 0.9521484375, 1.533203125, 2.1142578125, 2.6953125, 3.2763671875, 3.857421875, 4.4384765625, 5.01953125, 5.6005859375, 6.181640625, 6.7626953125, 7.34375, 7.9248046875, 8.505859375, 9.0869140625, 9.66796875, 10.2490234375, 10.830078125, 11.4111328125, 11.9921875, 12.5732421875, 13.154296875, 13.7353515625, 14.31640625, 14.8974609375, 15.478515625, 16.0595703125, 16.640625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 7.0, 12.0, 12.0, 22.0, 32.0, 47.0, 74.0, 117.0, 179.0, 344.0, 785.0, 7653.0, 3827827.0, 353859.0, 2163.0, 521.0, 239.0, 136.0, 89.0, 58.0, 39.0, 13.0, 16.0, 13.0, 5.0, 3.0, 2.0, 4.0, 0.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.40625, -59.34619140625, -57.2861328125, -55.22607421875, -53.166015625, -51.10595703125, -49.0458984375, -46.98583984375, -44.92578125, -42.86572265625, -40.8056640625, -38.74560546875, -36.685546875, -34.62548828125, -32.5654296875, -30.50537109375, -28.4453125, -26.38525390625, -24.3251953125, -22.26513671875, -20.205078125, -18.14501953125, -16.0849609375, -14.02490234375, -11.96484375, -9.90478515625, -7.8447265625, -5.78466796875, -3.724609375, -1.66455078125, 0.3955078125, 2.45556640625, 4.515625, 6.57568359375, 8.6357421875, 10.69580078125, 12.755859375, 14.81591796875, 16.8759765625, 18.93603515625, 20.99609375, 23.05615234375, 25.1162109375, 27.17626953125, 29.236328125, 31.29638671875, 33.3564453125, 35.41650390625, 37.4765625, 39.53662109375, 41.5966796875, 43.65673828125, 45.716796875, 47.77685546875, 49.8369140625, 51.89697265625, 53.95703125, 56.01708984375, 58.0771484375, 60.13720703125, 62.197265625, 64.25732421875, 66.3173828125, 68.37744140625, 70.4375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 63.0, 750.0, 202.0, 4.0, 0.0, 1.0], "bins": [-625.9633178710938, -615.465576171875, -604.9678955078125, -594.4701538085938, -583.972412109375, -573.4747314453125, -562.9769897460938, -552.479248046875, -541.9815063476562, -531.4837646484375, -520.986083984375, -510.48834228515625, -499.9906005859375, -489.4928894042969, -478.99517822265625, -468.4974365234375, -457.999755859375, -447.5020446777344, -437.0043029785156, -426.506591796875, -416.00885009765625, -405.5111389160156, -395.013427734375, -384.51568603515625, -374.0179443359375, -363.5202331542969, -353.0224914550781, -342.5247802734375, -332.02703857421875, -321.5293273925781, -311.0316162109375, -300.53387451171875, -290.0361328125, -279.5384216308594, -269.0406799316406, -258.54296875, -248.0452423095703, -237.54751586914062, -227.04978942871094, -216.55206298828125, -206.05435180664062, -195.55662536621094, -185.05889892578125, -174.56118774414062, -164.06346130371094, -153.56573486328125, -143.06800842285156, -132.57028198242188, -122.07257080078125, -111.57484436035156, -101.0771255493164, -90.57939910888672, -80.08168029785156, -69.58395385742188, -59.08622741699219, -48.58850860595703, -38.09077835083008, -27.593055725097656, -17.0953311920166, -6.597606658935547, 3.900115966796875, 14.397838592529297, 24.895565032958984, 35.39328384399414, 45.89101028442383]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 11.0, 6.0, 9.0, 10.0, 13.0, 22.0, 11.0, 24.0, 23.0, 25.0, 24.0, 30.0, 25.0, 35.0, 47.0, 33.0, 34.0, 35.0, 49.0, 44.0, 35.0, 43.0, 44.0, 45.0, 39.0, 30.0, 29.0, 31.0, 30.0, 21.0, 22.0, 20.0, 14.0, 24.0, 11.0, 15.0, 5.0, 9.0, 10.0, 2.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-47.733917236328125, -46.17435073852539, -44.614784240722656, -43.055213928222656, -41.49564743041992, -39.93608093261719, -38.37651443481445, -36.81694793701172, -35.25737762451172, -33.697811126708984, -32.13824462890625, -30.578676223754883, -29.019107818603516, -27.45954132080078, -25.899974822998047, -24.340408325195312, -22.780841827392578, -21.221275329589844, -19.661706924438477, -18.102140426635742, -16.542572021484375, -14.98300552368164, -13.423439025878906, -11.863871574401855, -10.304304122924805, -8.744736671447754, -7.185169696807861, -5.625602722167969, -4.066035270690918, -2.506467819213867, -0.9469013214111328, 0.612666130065918, 2.1722335815429688, 3.7318007946014404, 5.291368007659912, 6.850934982299805, 8.410502433776855, 9.970069885253906, 11.52963638305664, 13.089203834533691, 14.648771286010742, 16.208337783813477, 17.767906188964844, 19.327472686767578, 20.887039184570312, 22.44660758972168, 24.006174087524414, 25.56574249267578, 27.125308990478516, 28.68487548828125, 30.244443893432617, 31.80401039123535, 33.36357879638672, 34.92314529418945, 36.48271179199219, 38.04227828979492, 39.601844787597656, 41.16141128540039, 42.720977783203125, 44.280548095703125, 45.84011459350586, 47.399681091308594, 48.95924758911133, 50.51881408691406, 52.07838439941406]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 1.0, 5.0, 6.0, 6.0, 7.0, 8.0, 12.0, 8.0, 12.0, 15.0, 22.0, 23.0, 21.0, 17.0, 23.0, 38.0, 38.0, 39.0, 34.0, 37.0, 40.0, 24.0, 36.0, 40.0, 43.0, 39.0, 41.0, 37.0, 30.0, 30.0, 26.0, 28.0, 26.0, 19.0, 22.0, 29.0, 25.0, 16.0, 13.0, 11.0, 11.0, 9.0, 12.0, 9.0, 3.0, 1.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.607421875, -3.485076904296875, -3.36273193359375, -3.240386962890625, -3.1180419921875, -2.995697021484375, -2.87335205078125, -2.751007080078125, -2.628662109375, -2.506317138671875, -2.38397216796875, -2.261627197265625, -2.1392822265625, -2.016937255859375, -1.89459228515625, -1.772247314453125, -1.64990234375, -1.527557373046875, -1.40521240234375, -1.282867431640625, -1.1605224609375, -1.038177490234375, -0.91583251953125, -0.793487548828125, -0.671142578125, -0.548797607421875, -0.42645263671875, -0.304107666015625, -0.1817626953125, -0.059417724609375, 0.06292724609375, 0.185272216796875, 0.3076171875, 0.429962158203125, 0.55230712890625, 0.674652099609375, 0.7969970703125, 0.919342041015625, 1.04168701171875, 1.164031982421875, 1.286376953125, 1.408721923828125, 1.53106689453125, 1.653411865234375, 1.7757568359375, 1.898101806640625, 2.02044677734375, 2.142791748046875, 2.26513671875, 2.387481689453125, 2.50982666015625, 2.632171630859375, 2.7545166015625, 2.876861572265625, 2.99920654296875, 3.121551513671875, 3.243896484375, 3.366241455078125, 3.48858642578125, 3.610931396484375, 3.7332763671875, 3.855621337890625, 3.97796630859375, 4.100311279296875, 4.22265625]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 9.0, 12.0, 22.0, 22.0, 46.0, 59.0, 102.0, 146.0, 177.0, 303.0, 477.0, 725.0, 1060.0, 1588.0, 2359.0, 3474.0, 5244.0, 7995.0, 12159.0, 18648.0, 29473.0, 47707.0, 82005.0, 155317.0, 314208.0, 153254.0, 81093.0, 47581.0, 29211.0, 18489.0, 12061.0, 7754.0, 5256.0, 3429.0, 2342.0, 1606.0, 991.0, 744.0, 490.0, 291.0, 244.0, 130.0, 83.0, 71.0, 37.0, 18.0, 14.0, 13.0, 10.0, 8.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.90478515625, -0.8769378662109375, -0.849090576171875, -0.8212432861328125, -0.79339599609375, -0.7655487060546875, -0.737701416015625, -0.7098541259765625, -0.6820068359375, -0.6541595458984375, -0.626312255859375, -0.5984649658203125, -0.57061767578125, -0.5427703857421875, -0.514923095703125, -0.4870758056640625, -0.459228515625, -0.4313812255859375, -0.403533935546875, -0.3756866455078125, -0.34783935546875, -0.3199920654296875, -0.292144775390625, -0.2642974853515625, -0.2364501953125, -0.2086029052734375, -0.180755615234375, -0.1529083251953125, -0.12506103515625, -0.0972137451171875, -0.069366455078125, -0.0415191650390625, -0.013671875, 0.0141754150390625, 0.042022705078125, 0.0698699951171875, 0.09771728515625, 0.1255645751953125, 0.153411865234375, 0.1812591552734375, 0.2091064453125, 0.2369537353515625, 0.264801025390625, 0.2926483154296875, 0.32049560546875, 0.3483428955078125, 0.376190185546875, 0.4040374755859375, 0.431884765625, 0.4597320556640625, 0.487579345703125, 0.5154266357421875, 0.54327392578125, 0.5711212158203125, 0.598968505859375, 0.6268157958984375, 0.6546630859375, 0.6825103759765625, 0.710357666015625, 0.7382049560546875, 0.76605224609375, 0.7938995361328125, 0.821746826171875, 0.8495941162109375, 0.87744140625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 6.0, 4.0, 8.0, 15.0, 19.0, 14.0, 19.0, 18.0, 19.0, 24.0, 29.0, 39.0, 40.0, 27.0, 42.0, 45.0, 52.0, 37.0, 1057.0, 41.0, 44.0, 41.0, 36.0, 47.0, 41.0, 40.0, 22.0, 27.0, 22.0, 30.0, 20.0, 15.0, 16.0, 14.0, 10.0, 4.0, 9.0, 5.0, 7.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.865234375, -2.78009033203125, -2.6949462890625, -2.60980224609375, -2.524658203125, -2.43951416015625, -2.3543701171875, -2.26922607421875, -2.18408203125, -2.09893798828125, -2.0137939453125, -1.92864990234375, -1.843505859375, -1.75836181640625, -1.6732177734375, -1.58807373046875, -1.5029296875, -1.41778564453125, -1.3326416015625, -1.24749755859375, -1.162353515625, -1.07720947265625, -0.9920654296875, -0.90692138671875, -0.82177734375, -0.73663330078125, -0.6514892578125, -0.56634521484375, -0.481201171875, -0.39605712890625, -0.3109130859375, -0.22576904296875, -0.140625, -0.05548095703125, 0.0296630859375, 0.11480712890625, 0.199951171875, 0.28509521484375, 0.3702392578125, 0.45538330078125, 0.54052734375, 0.62567138671875, 0.7108154296875, 0.79595947265625, 0.881103515625, 0.96624755859375, 1.0513916015625, 1.13653564453125, 1.2216796875, 1.30682373046875, 1.3919677734375, 1.47711181640625, 1.562255859375, 1.64739990234375, 1.7325439453125, 1.81768798828125, 1.90283203125, 1.98797607421875, 2.0731201171875, 2.15826416015625, 2.243408203125, 2.32855224609375, 2.4136962890625, 2.49884033203125, 2.583984375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 2.0, 7.0, 5.0, 10.0, 11.0, 21.0, 28.0, 51.0, 73.0, 127.0, 225.0, 381.0, 674.0, 1258.0, 2331.0, 4520.0, 8611.0, 17369.0, 36078.0, 80013.0, 221953.0, 1481098.0, 133844.0, 55731.0, 26079.0, 12618.0, 6542.0, 3402.0, 1781.0, 960.0, 551.0, 298.0, 196.0, 103.0, 58.0, 47.0, 26.0, 13.0, 6.0, 9.0, 6.0, 4.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.25390625, -1.212493896484375, -1.17108154296875, -1.129669189453125, -1.0882568359375, -1.046844482421875, -1.00543212890625, -0.964019775390625, -0.922607421875, -0.881195068359375, -0.83978271484375, -0.798370361328125, -0.7569580078125, -0.715545654296875, -0.67413330078125, -0.632720947265625, -0.59130859375, -0.549896240234375, -0.50848388671875, -0.467071533203125, -0.4256591796875, -0.384246826171875, -0.34283447265625, -0.301422119140625, -0.260009765625, -0.218597412109375, -0.17718505859375, -0.135772705078125, -0.0943603515625, -0.052947998046875, -0.01153564453125, 0.029876708984375, 0.0712890625, 0.112701416015625, 0.15411376953125, 0.195526123046875, 0.2369384765625, 0.278350830078125, 0.31976318359375, 0.361175537109375, 0.402587890625, 0.444000244140625, 0.48541259765625, 0.526824951171875, 0.5682373046875, 0.609649658203125, 0.65106201171875, 0.692474365234375, 0.73388671875, 0.775299072265625, 0.81671142578125, 0.858123779296875, 0.8995361328125, 0.940948486328125, 0.98236083984375, 1.023773193359375, 1.065185546875, 1.106597900390625, 1.14801025390625, 1.189422607421875, 1.2308349609375, 1.272247314453125, 1.31365966796875, 1.355072021484375, 1.396484375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 4.0, 3.0, 10.0, 6.0, 10.0, 12.0, 21.0, 17.0, 18.0, 24.0, 32.0, 33.0, 45.0, 44.0, 60.0, 69.0, 68.0, 66.0, 70.0, 58.0, 47.0, 53.0, 42.0, 37.0, 31.0, 21.0, 22.0, 12.0, 16.0, 12.0, 12.0, 6.0, 6.0, 8.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007085800170898438, -0.0006885379552841187, -0.0006684958934783936, -0.0006484538316726685, -0.0006284117698669434, -0.0006083697080612183, -0.0005883276462554932, -0.0005682855844497681, -0.000548243522644043, -0.0005282014608383179, -0.0005081593990325928, -0.0004881173372268677, -0.0004680752754211426, -0.0004480332136154175, -0.0004279911518096924, -0.0004079490900039673, -0.0003879070281982422, -0.0003678649663925171, -0.000347822904586792, -0.0003277808427810669, -0.0003077387809753418, -0.0002876967191696167, -0.0002676546573638916, -0.0002476125955581665, -0.0002275705337524414, -0.0002075284719467163, -0.0001874864101409912, -0.0001674443483352661, -0.00014740228652954102, -0.00012736022472381592, -0.00010731816291809082, -8.727610111236572e-05, -6.723403930664062e-05, -4.719197750091553e-05, -2.714991569519043e-05, -7.107853889465332e-06, 1.2934207916259766e-05, 3.297626972198486e-05, 5.301833152770996e-05, 7.306039333343506e-05, 9.310245513916016e-05, 0.00011314451694488525, 0.00013318657875061035, 0.00015322864055633545, 0.00017327070236206055, 0.00019331276416778564, 0.00021335482597351074, 0.00023339688777923584, 0.00025343894958496094, 0.00027348101139068604, 0.00029352307319641113, 0.00031356513500213623, 0.00033360719680786133, 0.0003536492586135864, 0.0003736913204193115, 0.0003937333822250366, 0.0004137754440307617, 0.0004338175058364868, 0.0004538595676422119, 0.000473901629447937, 0.0004939436912536621, 0.0005139857530593872, 0.0005340278148651123, 0.0005540698766708374, 0.0005741119384765625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 6.0, 2.0, 2.0, 4.0, 5.0, 5.0, 4.0, 11.0, 13.0, 2.0, 16.0, 16.0, 20.0, 24.0, 17.0, 39.0, 52.0, 59.0, 68.0, 91.0, 173.0, 209.0, 371.0, 964.0, 656924.0, 387356.0, 910.0, 383.0, 221.0, 127.0, 118.0, 89.0, 44.0, 41.0, 30.0, 24.0, 20.0, 25.0, 16.0, 15.0, 9.0, 8.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01163482666015625, -0.011233210563659668, -0.010831594467163086, -0.010429978370666504, -0.010028362274169922, -0.00962674617767334, -0.009225130081176758, -0.008823513984680176, -0.008421897888183594, -0.008020281791687012, -0.00761866569519043, -0.007217049598693848, -0.006815433502197266, -0.006413817405700684, -0.0060122013092041016, -0.0056105852127075195, -0.0052089691162109375, -0.0048073530197143555, -0.0044057369232177734, -0.004004120826721191, -0.0036025047302246094, -0.0032008886337280273, -0.0027992725372314453, -0.0023976564407348633, -0.0019960403442382812, -0.0015944242477416992, -0.0011928081512451172, -0.0007911920547485352, -0.0003895759582519531, 1.2040138244628906e-05, 0.00041365623474121094, 0.000815272331237793, 0.001216888427734375, 0.001618504524230957, 0.002020120620727539, 0.002421736717224121, 0.002823352813720703, 0.003224968910217285, 0.003626585006713867, 0.004028201103210449, 0.004429817199707031, 0.004831433296203613, 0.005233049392700195, 0.005634665489196777, 0.006036281585693359, 0.006437897682189941, 0.0068395137786865234, 0.0072411298751831055, 0.0076427459716796875, 0.00804436206817627, 0.008445978164672852, 0.008847594261169434, 0.009249210357666016, 0.009650826454162598, 0.01005244255065918, 0.010454058647155762, 0.010855674743652344, 0.011257290840148926, 0.011658906936645508, 0.01206052303314209, 0.012462139129638672, 0.012863755226135254, 0.013265371322631836, 0.013666987419128418, 0.014068603515625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 44.0, 614.0, 347.0, 10.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007031603017821908, -0.0006316837971098721, -0.0005602072924375534, -0.0004887307877652347, -0.000417254283092916, -0.0003457777784205973, -0.0002743012737482786, -0.00020282476907595992, -0.00013134826440364122, -5.987175973132253e-05, 1.160474494099617e-05, 8.308124961331487e-05, 0.00015455775428563356, 0.00022603425895795226, 0.00029751076363027096, 0.00036898726830258965, 0.00044046377297490835, 0.000511940277647227, 0.0005834167823195457, 0.0006548932869918644, 0.0007263697916641831, 0.0007978462963365018, 0.0008693228010088205, 0.0009407993056811392, 0.001012275810353458, 0.0010837523732334375, 0.0011552288196980953, 0.001226705266162753, 0.0012981818290427327, 0.0013696583919227123, 0.0014411348383873701, 0.001512611284852028, 0.0015840879641473293, 0.0016555644106119871, 0.0017270409734919667, 0.0017985175363719463, 0.0018699939828366041, 0.001941470429301262, 0.0020129471085965633, 0.002084423555061221, 0.002155900001525879, 0.0022273764479905367, 0.0022988528944551945, 0.002370329573750496, 0.0024418060202151537, 0.0025132824666798115, 0.002584759145975113, 0.0026562355924397707, 0.0027277120389044285, 0.0027991884853690863, 0.002870664931833744, 0.0029421416111290455, 0.0030136180575937033, 0.003085094504058361, 0.0031565711833536625, 0.0032280476298183203, 0.003299524076282978, 0.003371000522747636, 0.0034424769692122936, 0.003513953648507595, 0.003585430094972253, 0.0036569065414369106, 0.003728383220732212, 0.00379985966719687, 0.0038713361136615276]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 3.0, 7.0, 7.0, 9.0, 8.0, 8.0, 10.0, 13.0, 17.0, 14.0, 22.0, 11.0, 29.0, 32.0, 34.0, 21.0, 46.0, 33.0, 38.0, 36.0, 33.0, 37.0, 39.0, 35.0, 43.0, 40.0, 31.0, 35.0, 38.0, 35.0, 33.0, 41.0, 15.0, 20.0, 15.0, 15.0, 24.0, 14.0, 8.0, 12.0, 9.0, 8.0, 3.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027930736541748047, -0.0002703089267015457, -0.00026131048798561096, -0.0002523120492696762, -0.00024331361055374146, -0.0002343151718378067, -0.00022531673312187195, -0.0002163182944059372, -0.00020731985569000244, -0.0001983214169740677, -0.00018932297825813293, -0.00018032453954219818, -0.00017132610082626343, -0.00016232766211032867, -0.00015332922339439392, -0.00014433078467845917, -0.00013533234596252441, -0.00012633390724658966, -0.00011733546853065491, -0.00010833702981472015, -9.93385910987854e-05, -9.034015238285065e-05, -8.13417136669159e-05, -7.234327495098114e-05, -6.334483623504639e-05, -5.434639751911163e-05, -4.534795880317688e-05, -3.6349520087242126e-05, -2.7351081371307373e-05, -1.835264265537262e-05, -9.354203939437866e-06, -3.557652235031128e-07, 8.64267349243164e-06, 1.7641112208366394e-05, 2.6639550924301147e-05, 3.56379896402359e-05, 4.4636428356170654e-05, 5.363486707210541e-05, 6.263330578804016e-05, 7.163174450397491e-05, 8.063018321990967e-05, 8.962862193584442e-05, 9.862706065177917e-05, 0.00010762549936771393, 0.00011662393808364868, 0.00012562237679958344, 0.0001346208155155182, 0.00014361925423145294, 0.0001526176929473877, 0.00016161613166332245, 0.0001706145703792572, 0.00017961300909519196, 0.0001886114478111267, 0.00019760988652706146, 0.00020660832524299622, 0.00021560676395893097, 0.00022460520267486572, 0.00023360364139080048, 0.00024260208010673523, 0.00025160051882267, 0.00026059895753860474, 0.0002695973962545395, 0.00027859583497047424, 0.000287594273686409, 0.00029659271240234375]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 1.0, 5.0, 6.0, 6.0, 7.0, 8.0, 12.0, 8.0, 12.0, 15.0, 22.0, 23.0, 21.0, 17.0, 23.0, 38.0, 38.0, 39.0, 34.0, 37.0, 40.0, 24.0, 36.0, 40.0, 43.0, 39.0, 41.0, 37.0, 30.0, 30.0, 26.0, 28.0, 26.0, 19.0, 22.0, 29.0, 25.0, 16.0, 13.0, 11.0, 11.0, 9.0, 12.0, 9.0, 3.0, 1.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.607421875, -3.485076904296875, -3.36273193359375, -3.240386962890625, -3.1180419921875, -2.995697021484375, -2.87335205078125, -2.751007080078125, -2.628662109375, -2.506317138671875, -2.38397216796875, -2.261627197265625, -2.1392822265625, -2.016937255859375, -1.89459228515625, -1.772247314453125, -1.64990234375, -1.527557373046875, -1.40521240234375, -1.282867431640625, -1.1605224609375, -1.038177490234375, -0.91583251953125, -0.793487548828125, -0.671142578125, -0.548797607421875, -0.42645263671875, -0.304107666015625, -0.1817626953125, -0.059417724609375, 0.06292724609375, 0.185272216796875, 0.3076171875, 0.429962158203125, 0.55230712890625, 0.674652099609375, 0.7969970703125, 0.919342041015625, 1.04168701171875, 1.164031982421875, 1.286376953125, 1.408721923828125, 1.53106689453125, 1.653411865234375, 1.7757568359375, 1.898101806640625, 2.02044677734375, 2.142791748046875, 2.26513671875, 2.387481689453125, 2.50982666015625, 2.632171630859375, 2.7545166015625, 2.876861572265625, 2.99920654296875, 3.121551513671875, 3.243896484375, 3.366241455078125, 3.48858642578125, 3.610931396484375, 3.7332763671875, 3.855621337890625, 3.97796630859375, 4.100311279296875, 4.22265625]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 6.0, 10.0, 10.0, 14.0, 20.0, 20.0, 39.0, 54.0, 63.0, 90.0, 94.0, 137.0, 204.0, 277.0, 338.0, 519.0, 722.0, 980.0, 1664.0, 2577.0, 4580.0, 8532.0, 18003.0, 42269.0, 108579.0, 308918.0, 340380.0, 121038.0, 46423.0, 19756.0, 9244.0, 4741.0, 2701.0, 1720.0, 1122.0, 745.0, 546.0, 362.0, 308.0, 198.0, 157.0, 99.0, 93.0, 51.0, 37.0, 32.0, 34.0, 13.0, 16.0, 8.0, 5.0, 5.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.59375, -2.510223388671875, -2.42669677734375, -2.343170166015625, -2.2596435546875, -2.176116943359375, -2.09259033203125, -2.009063720703125, -1.925537109375, -1.842010498046875, -1.75848388671875, -1.674957275390625, -1.5914306640625, -1.507904052734375, -1.42437744140625, -1.340850830078125, -1.25732421875, -1.173797607421875, -1.09027099609375, -1.006744384765625, -0.9232177734375, -0.839691162109375, -0.75616455078125, -0.672637939453125, -0.589111328125, -0.505584716796875, -0.42205810546875, -0.338531494140625, -0.2550048828125, -0.171478271484375, -0.08795166015625, -0.004425048828125, 0.0791015625, 0.162628173828125, 0.24615478515625, 0.329681396484375, 0.4132080078125, 0.496734619140625, 0.58026123046875, 0.663787841796875, 0.747314453125, 0.830841064453125, 0.91436767578125, 0.997894287109375, 1.0814208984375, 1.164947509765625, 1.24847412109375, 1.332000732421875, 1.41552734375, 1.499053955078125, 1.58258056640625, 1.666107177734375, 1.7496337890625, 1.833160400390625, 1.91668701171875, 2.000213623046875, 2.083740234375, 2.167266845703125, 2.25079345703125, 2.334320068359375, 2.4178466796875, 2.501373291015625, 2.58489990234375, 2.668426513671875, 2.751953125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 5.0, 13.0, 10.0, 13.0, 10.0, 13.0, 14.0, 13.0, 16.0, 24.0, 24.0, 32.0, 17.0, 21.0, 30.0, 45.0, 37.0, 38.0, 43.0, 96.0, 461.0, 1522.0, 100.0, 39.0, 44.0, 35.0, 31.0, 42.0, 30.0, 29.0, 20.0, 27.0, 11.0, 19.0, 18.0, 20.0, 16.0, 7.0, 11.0, 11.0, 4.0, 6.0, 5.0, 4.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0], "bins": [-13.875, -13.4671630859375, -13.059326171875, -12.6514892578125, -12.24365234375, -11.8358154296875, -11.427978515625, -11.0201416015625, -10.6123046875, -10.2044677734375, -9.796630859375, -9.3887939453125, -8.98095703125, -8.5731201171875, -8.165283203125, -7.7574462890625, -7.349609375, -6.9417724609375, -6.533935546875, -6.1260986328125, -5.71826171875, -5.3104248046875, -4.902587890625, -4.4947509765625, -4.0869140625, -3.6790771484375, -3.271240234375, -2.8634033203125, -2.45556640625, -2.0477294921875, -1.639892578125, -1.2320556640625, -0.82421875, -0.4163818359375, -0.008544921875, 0.3992919921875, 0.80712890625, 1.2149658203125, 1.622802734375, 2.0306396484375, 2.4384765625, 2.8463134765625, 3.254150390625, 3.6619873046875, 4.06982421875, 4.4776611328125, 4.885498046875, 5.2933349609375, 5.701171875, 6.1090087890625, 6.516845703125, 6.9246826171875, 7.33251953125, 7.7403564453125, 8.148193359375, 8.5560302734375, 8.9638671875, 9.3717041015625, 9.779541015625, 10.1873779296875, 10.59521484375, 11.0030517578125, 11.410888671875, 11.8187255859375, 12.2265625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 5.0, 4.0, 2.0, 2.0, 5.0, 4.0, 9.0, 6.0, 12.0, 5.0, 15.0, 14.0, 15.0, 22.0, 24.0, 16.0, 32.0, 40.0, 56.0, 77.0, 90.0, 152.0, 266.0, 532.0, 1647.0, 31047.0, 3064994.0, 43279.0, 1852.0, 580.0, 294.0, 171.0, 105.0, 59.0, 40.0, 37.0, 37.0, 25.0, 24.0, 14.0, 16.0, 18.0, 9.0, 13.0, 10.0, 15.0, 5.0, 6.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-20.6875, -19.987060546875, -19.28662109375, -18.586181640625, -17.8857421875, -17.185302734375, -16.48486328125, -15.784423828125, -15.083984375, -14.383544921875, -13.68310546875, -12.982666015625, -12.2822265625, -11.581787109375, -10.88134765625, -10.180908203125, -9.48046875, -8.780029296875, -8.07958984375, -7.379150390625, -6.6787109375, -5.978271484375, -5.27783203125, -4.577392578125, -3.876953125, -3.176513671875, -2.47607421875, -1.775634765625, -1.0751953125, -0.374755859375, 0.32568359375, 1.026123046875, 1.7265625, 2.427001953125, 3.12744140625, 3.827880859375, 4.5283203125, 5.228759765625, 5.92919921875, 6.629638671875, 7.330078125, 8.030517578125, 8.73095703125, 9.431396484375, 10.1318359375, 10.832275390625, 11.53271484375, 12.233154296875, 12.93359375, 13.634033203125, 14.33447265625, 15.034912109375, 15.7353515625, 16.435791015625, 17.13623046875, 17.836669921875, 18.537109375, 19.237548828125, 19.93798828125, 20.638427734375, 21.3388671875, 22.039306640625, 22.73974609375, 23.440185546875, 24.140625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 7.0, 29.0, 112.0, 224.0, 290.0, 192.0, 117.0, 27.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.649145126342773, -27.79249382019043, -26.935842514038086, -26.079191207885742, -25.22254180908203, -24.365890502929688, -23.509239196777344, -22.652587890625, -21.795936584472656, -20.939285278320312, -20.08263397216797, -19.225982666015625, -18.36933135986328, -17.512680053710938, -16.656030654907227, -15.799379348754883, -14.942728042602539, -14.086076736450195, -13.229425430297852, -12.372775077819824, -11.51612377166748, -10.659472465515137, -9.80282211303711, -8.946170806884766, -8.089519500732422, -7.232868194580078, -6.376217365264893, -5.519566535949707, -4.662915229797363, -3.8062639236450195, -2.949613094329834, -2.0929622650146484, -1.2363128662109375, -0.37966179847717285, 0.4769892692565918, 1.3336403369903564, 2.190291404724121, 3.046942710876465, 3.9035935401916504, 4.760244369506836, 5.61689567565918, 6.473546981811523, 7.330197811126709, 8.186848640441895, 9.043499946594238, 9.900151252746582, 10.75680160522461, 11.613452911376953, 12.470104217529297, 13.32675552368164, 14.183406829833984, 15.040057182312012, 15.896708488464355, 16.753360748291016, 17.610010147094727, 18.46666145324707, 19.323312759399414, 20.179964065551758, 21.0366153717041, 21.893266677856445, 22.749916076660156, 23.6065673828125, 24.463218688964844, 25.319869995117188, 26.17652130126953]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 7.0, 11.0, 8.0, 17.0, 14.0, 11.0, 17.0, 16.0, 22.0, 26.0, 35.0, 22.0, 37.0, 41.0, 35.0, 42.0, 53.0, 45.0, 34.0, 42.0, 44.0, 35.0, 42.0, 39.0, 34.0, 38.0, 27.0, 26.0, 30.0, 26.0, 23.0, 16.0, 18.0, 5.0, 11.0, 5.0, 12.0, 8.0, 5.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.485774993896484, -46.898109436035156, -45.310447692871094, -43.722782135009766, -42.1351203918457, -40.547454833984375, -38.95979309082031, -37.372127532958984, -35.784461975097656, -34.19679641723633, -32.609134674072266, -31.021469116210938, -29.433805465698242, -27.846141815185547, -26.25847816467285, -24.670814514160156, -23.08315086364746, -21.495487213134766, -19.90782356262207, -18.320159912109375, -16.732494354248047, -15.144830703735352, -13.557167053222656, -11.969502449035645, -10.38183879852295, -8.794175148010254, -7.206510543823242, -5.618846893310547, -4.031182765960693, -2.44351863861084, -0.8558549880981445, 0.7318096160888672, 2.3194732666015625, 3.907137393951416, 5.4948015213012695, 7.082465171813965, 8.670129776000977, 10.257793426513672, 11.845457077026367, 13.433121681213379, 15.020785331726074, 16.608449935913086, 18.19611358642578, 19.783777236938477, 21.371440887451172, 22.9591064453125, 24.546768188476562, 26.13443374633789, 27.722097396850586, 29.30976104736328, 30.897424697875977, 32.48508834838867, 34.07275390625, 35.66041564941406, 37.24808120727539, 38.83574676513672, 40.42340850830078, 42.01107406616211, 43.59873580932617, 45.1864013671875, 46.77406311035156, 48.36172866821289, 49.94939422607422, 51.53705596923828, 53.12472152709961]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 5.0, 6.0, 3.0, 8.0, 11.0, 9.0, 10.0, 7.0, 12.0, 22.0, 17.0, 22.0, 28.0, 15.0, 35.0, 33.0, 37.0, 39.0, 30.0, 40.0, 28.0, 35.0, 33.0, 43.0, 48.0, 42.0, 28.0, 37.0, 29.0, 28.0, 25.0, 24.0, 33.0, 24.0, 23.0, 21.0, 23.0, 15.0, 14.0, 12.0, 9.0, 11.0, 9.0, 4.0, 2.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.76953125, -3.6439208984375, -3.518310546875, -3.3927001953125, -3.26708984375, -3.1414794921875, -3.015869140625, -2.8902587890625, -2.7646484375, -2.6390380859375, -2.513427734375, -2.3878173828125, -2.26220703125, -2.1365966796875, -2.010986328125, -1.8853759765625, -1.759765625, -1.6341552734375, -1.508544921875, -1.3829345703125, -1.25732421875, -1.1317138671875, -1.006103515625, -0.8804931640625, -0.7548828125, -0.6292724609375, -0.503662109375, -0.3780517578125, -0.25244140625, -0.1268310546875, -0.001220703125, 0.1243896484375, 0.25, 0.3756103515625, 0.501220703125, 0.6268310546875, 0.75244140625, 0.8780517578125, 1.003662109375, 1.1292724609375, 1.2548828125, 1.3804931640625, 1.506103515625, 1.6317138671875, 1.75732421875, 1.8829345703125, 2.008544921875, 2.1341552734375, 2.259765625, 2.3853759765625, 2.510986328125, 2.6365966796875, 2.76220703125, 2.8878173828125, 3.013427734375, 3.1390380859375, 3.2646484375, 3.3902587890625, 3.515869140625, 3.6414794921875, 3.76708984375, 3.8927001953125, 4.018310546875, 4.1439208984375, 4.26953125]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 5.0, 14.0, 6.0, 10.0, 6.0, 6.0, 8.0, 27.0, 13.0, 28.0, 18.0, 34.0, 27.0, 31.0, 26.0, 33.0, 68.0, 134.0, 403.0, 2336.0, 72422.0, 3807337.0, 305726.0, 4451.0, 538.0, 174.0, 71.0, 36.0, 36.0, 29.0, 28.0, 25.0, 22.0, 22.0, 20.0, 20.0, 16.0, 15.0, 13.0, 10.0, 7.0, 7.0, 9.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.15625, -24.36083984375, -23.5654296875, -22.77001953125, -21.974609375, -21.17919921875, -20.3837890625, -19.58837890625, -18.79296875, -17.99755859375, -17.2021484375, -16.40673828125, -15.611328125, -14.81591796875, -14.0205078125, -13.22509765625, -12.4296875, -11.63427734375, -10.8388671875, -10.04345703125, -9.248046875, -8.45263671875, -7.6572265625, -6.86181640625, -6.06640625, -5.27099609375, -4.4755859375, -3.68017578125, -2.884765625, -2.08935546875, -1.2939453125, -0.49853515625, 0.296875, 1.09228515625, 1.8876953125, 2.68310546875, 3.478515625, 4.27392578125, 5.0693359375, 5.86474609375, 6.66015625, 7.45556640625, 8.2509765625, 9.04638671875, 9.841796875, 10.63720703125, 11.4326171875, 12.22802734375, 13.0234375, 13.81884765625, 14.6142578125, 15.40966796875, 16.205078125, 17.00048828125, 17.7958984375, 18.59130859375, 19.38671875, 20.18212890625, 20.9775390625, 21.77294921875, 22.568359375, 23.36376953125, 24.1591796875, 24.95458984375, 25.75]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 11.0, 9.0, 20.0, 22.0, 25.0, 42.0, 60.0, 76.0, 129.0, 184.0, 263.0, 351.0, 500.0, 567.0, 473.0, 397.0, 297.0, 193.0, 131.0, 96.0, 76.0, 50.0, 34.0, 19.0, 13.0, 14.0, 7.0, 4.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.3828125, -14.9093017578125, -14.435791015625, -13.9622802734375, -13.48876953125, -13.0152587890625, -12.541748046875, -12.0682373046875, -11.5947265625, -11.1212158203125, -10.647705078125, -10.1741943359375, -9.70068359375, -9.2271728515625, -8.753662109375, -8.2801513671875, -7.806640625, -7.3331298828125, -6.859619140625, -6.3861083984375, -5.91259765625, -5.4390869140625, -4.965576171875, -4.4920654296875, -4.0185546875, -3.5450439453125, -3.071533203125, -2.5980224609375, -2.12451171875, -1.6510009765625, -1.177490234375, -0.7039794921875, -0.23046875, 0.2430419921875, 0.716552734375, 1.1900634765625, 1.66357421875, 2.1370849609375, 2.610595703125, 3.0841064453125, 3.5576171875, 4.0311279296875, 4.504638671875, 4.9781494140625, 5.45166015625, 5.9251708984375, 6.398681640625, 6.8721923828125, 7.345703125, 7.8192138671875, 8.292724609375, 8.7662353515625, 9.23974609375, 9.7132568359375, 10.186767578125, 10.6602783203125, 11.1337890625, 11.6072998046875, 12.080810546875, 12.5543212890625, 13.02783203125, 13.5013427734375, 13.974853515625, 14.4483642578125, 14.921875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 7.0, 11.0, 22.0, 22.0, 35.0, 59.0, 76.0, 122.0, 178.0, 298.0, 683.0, 3983.0, 2595022.0, 1589168.0, 3272.0, 587.0, 272.0, 160.0, 89.0, 68.0, 50.0, 31.0, 34.0, 6.0, 10.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.0625, -62.8916015625, -60.720703125, -58.5498046875, -56.37890625, -54.2080078125, -52.037109375, -49.8662109375, -47.6953125, -45.5244140625, -43.353515625, -41.1826171875, -39.01171875, -36.8408203125, -34.669921875, -32.4990234375, -30.328125, -28.1572265625, -25.986328125, -23.8154296875, -21.64453125, -19.4736328125, -17.302734375, -15.1318359375, -12.9609375, -10.7900390625, -8.619140625, -6.4482421875, -4.27734375, -2.1064453125, 0.064453125, 2.2353515625, 4.40625, 6.5771484375, 8.748046875, 10.9189453125, 13.08984375, 15.2607421875, 17.431640625, 19.6025390625, 21.7734375, 23.9443359375, 26.115234375, 28.2861328125, 30.45703125, 32.6279296875, 34.798828125, 36.9697265625, 39.140625, 41.3115234375, 43.482421875, 45.6533203125, 47.82421875, 49.9951171875, 52.166015625, 54.3369140625, 56.5078125, 58.6787109375, 60.849609375, 63.0205078125, 65.19140625, 67.3623046875, 69.533203125, 71.7041015625, 73.875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 61.0, 452.0, 437.0, 56.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-422.2078857421875, -414.2410888671875, -406.2742919921875, -398.3074951171875, -390.3406982421875, -382.3739318847656, -374.4071350097656, -366.4403381347656, -358.4735412597656, -350.5067443847656, -342.5399475097656, -334.5731506347656, -326.60638427734375, -318.63958740234375, -310.67279052734375, -302.70599365234375, -294.73919677734375, -286.77239990234375, -278.80560302734375, -270.83880615234375, -262.87200927734375, -254.9052276611328, -246.93844604492188, -238.97164916992188, -231.00485229492188, -223.03805541992188, -215.07125854492188, -207.10447692871094, -199.13768005371094, -191.17088317871094, -183.2041015625, -175.2373046875, -167.2705078125, -159.3037109375, -151.3369140625, -143.37013244628906, -135.40333557128906, -127.43653869628906, -119.4697494506836, -111.50296020507812, -103.53617095947266, -95.56938171386719, -87.60258483886719, -79.63578796386719, -71.66899871826172, -63.702205657958984, -55.73541259765625, -47.768619537353516, -39.80182647705078, -31.835033416748047, -23.868240356445312, -15.901447296142578, -7.934654235839844, 0.032138824462890625, 7.998931884765625, 15.96572494506836, 23.932518005371094, 31.899311065673828, 39.86610412597656, 47.8328971862793, 55.79969024658203, 63.766483306884766, 71.7332763671875, 79.7000732421875, 87.66686248779297]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 4.0, 3.0, 9.0, 8.0, 7.0, 8.0, 9.0, 18.0, 23.0, 31.0, 27.0, 24.0, 25.0, 39.0, 26.0, 40.0, 36.0, 33.0, 40.0, 40.0, 42.0, 40.0, 43.0, 36.0, 42.0, 44.0, 32.0, 35.0, 33.0, 32.0, 29.0, 18.0, 26.0, 14.0, 15.0, 13.0, 12.0, 11.0, 9.0, 4.0, 4.0, 3.0, 5.0, 3.0, 2.0, 5.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.354095458984375, -43.87923049926758, -42.40436553955078, -40.92950439453125, -39.45463943481445, -37.979774475097656, -36.504913330078125, -35.03004837036133, -33.55518341064453, -32.080318450927734, -30.60545539855957, -29.130592346191406, -27.65572738647461, -26.180862426757812, -24.70599937438965, -23.231136322021484, -21.756271362304688, -20.28140640258789, -18.806543350219727, -17.331680297851562, -15.856815338134766, -14.381951332092285, -12.907087326049805, -11.432223320007324, -9.957359313964844, -8.482495307922363, -7.007631301879883, -5.532767295837402, -4.057903289794922, -2.5830392837524414, -1.108175277709961, 0.36668872833251953, 1.841552734375, 3.3164167404174805, 4.791280746459961, 6.266144752502441, 7.741008758544922, 9.215872764587402, 10.690736770629883, 12.165600776672363, 13.640464782714844, 15.115328788757324, 16.590192794799805, 18.06505584716797, 19.539920806884766, 21.014785766601562, 22.489648818969727, 23.96451187133789, 25.439376831054688, 26.914241790771484, 28.38910484313965, 29.863967895507812, 31.33883285522461, 32.813697814941406, 34.28855895996094, 35.763423919677734, 37.23828887939453, 38.71315383911133, 40.188018798828125, 41.662879943847656, 43.13774490356445, 44.61260986328125, 46.08747100830078, 47.56233596801758, 49.037200927734375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 4.0, 8.0, 6.0, 9.0, 11.0, 6.0, 13.0, 14.0, 21.0, 23.0, 24.0, 32.0, 29.0, 35.0, 27.0, 24.0, 35.0, 37.0, 41.0, 41.0, 44.0, 47.0, 35.0, 37.0, 46.0, 48.0, 23.0, 33.0, 27.0, 28.0, 24.0, 29.0, 22.0, 21.0, 22.0, 21.0, 12.0, 12.0, 9.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.888671875, -3.750762939453125, -3.61285400390625, -3.474945068359375, -3.3370361328125, -3.199127197265625, -3.06121826171875, -2.923309326171875, -2.785400390625, -2.647491455078125, -2.50958251953125, -2.371673583984375, -2.2337646484375, -2.095855712890625, -1.95794677734375, -1.820037841796875, -1.68212890625, -1.544219970703125, -1.40631103515625, -1.268402099609375, -1.1304931640625, -0.992584228515625, -0.85467529296875, -0.716766357421875, -0.578857421875, -0.440948486328125, -0.30303955078125, -0.165130615234375, -0.0272216796875, 0.110687255859375, 0.24859619140625, 0.386505126953125, 0.5244140625, 0.662322998046875, 0.80023193359375, 0.938140869140625, 1.0760498046875, 1.213958740234375, 1.35186767578125, 1.489776611328125, 1.627685546875, 1.765594482421875, 1.90350341796875, 2.041412353515625, 2.1793212890625, 2.317230224609375, 2.45513916015625, 2.593048095703125, 2.73095703125, 2.868865966796875, 3.00677490234375, 3.144683837890625, 3.2825927734375, 3.420501708984375, 3.55841064453125, 3.696319580078125, 3.834228515625, 3.972137451171875, 4.11004638671875, 4.247955322265625, 4.3858642578125, 4.523773193359375, 4.66168212890625, 4.799591064453125, 4.9375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 11.0, 11.0, 15.0, 17.0, 41.0, 51.0, 71.0, 150.0, 199.0, 308.0, 468.0, 704.0, 1133.0, 1774.0, 2803.0, 4348.0, 7042.0, 11512.0, 18448.0, 30253.0, 51191.0, 90853.0, 190803.0, 327302.0, 133220.0, 70293.0, 40867.0, 24560.0, 15001.0, 9332.0, 5679.0, 3675.0, 2298.0, 1487.0, 957.0, 599.0, 390.0, 243.0, 168.0, 103.0, 63.0, 45.0, 26.0, 14.0, 13.0, 15.0, 3.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0087890625, -0.9765472412109375, -0.944305419921875, -0.9120635986328125, -0.87982177734375, -0.8475799560546875, -0.815338134765625, -0.7830963134765625, -0.7508544921875, -0.7186126708984375, -0.686370849609375, -0.6541290283203125, -0.62188720703125, -0.5896453857421875, -0.557403564453125, -0.5251617431640625, -0.492919921875, -0.4606781005859375, -0.428436279296875, -0.3961944580078125, -0.36395263671875, -0.3317108154296875, -0.299468994140625, -0.2672271728515625, -0.2349853515625, -0.2027435302734375, -0.170501708984375, -0.1382598876953125, -0.10601806640625, -0.0737762451171875, -0.041534423828125, -0.0092926025390625, 0.02294921875, 0.0551910400390625, 0.087432861328125, 0.1196746826171875, 0.15191650390625, 0.1841583251953125, 0.216400146484375, 0.2486419677734375, 0.2808837890625, 0.3131256103515625, 0.345367431640625, 0.3776092529296875, 0.40985107421875, 0.4420928955078125, 0.474334716796875, 0.5065765380859375, 0.538818359375, 0.5710601806640625, 0.603302001953125, 0.6355438232421875, 0.66778564453125, 0.7000274658203125, 0.732269287109375, 0.7645111083984375, 0.7967529296875, 0.8289947509765625, 0.861236572265625, 0.8934783935546875, 0.92572021484375, 0.9579620361328125, 0.990203857421875, 1.0224456787109375, 1.0546875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 7.0, 5.0, 8.0, 7.0, 9.0, 10.0, 17.0, 14.0, 15.0, 24.0, 15.0, 20.0, 41.0, 41.0, 39.0, 39.0, 35.0, 39.0, 43.0, 49.0, 1086.0, 50.0, 50.0, 44.0, 36.0, 34.0, 46.0, 22.0, 31.0, 24.0, 23.0, 21.0, 14.0, 17.0, 11.0, 11.0, 2.0, 13.0, 3.0, 3.0, 2.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.3046875, -3.2047119140625, -3.104736328125, -3.0047607421875, -2.90478515625, -2.8048095703125, -2.704833984375, -2.6048583984375, -2.5048828125, -2.4049072265625, -2.304931640625, -2.2049560546875, -2.10498046875, -2.0050048828125, -1.905029296875, -1.8050537109375, -1.705078125, -1.6051025390625, -1.505126953125, -1.4051513671875, -1.30517578125, -1.2052001953125, -1.105224609375, -1.0052490234375, -0.9052734375, -0.8052978515625, -0.705322265625, -0.6053466796875, -0.50537109375, -0.4053955078125, -0.305419921875, -0.2054443359375, -0.10546875, -0.0054931640625, 0.094482421875, 0.1944580078125, 0.29443359375, 0.3944091796875, 0.494384765625, 0.5943603515625, 0.6943359375, 0.7943115234375, 0.894287109375, 0.9942626953125, 1.09423828125, 1.1942138671875, 1.294189453125, 1.3941650390625, 1.494140625, 1.5941162109375, 1.694091796875, 1.7940673828125, 1.89404296875, 1.9940185546875, 2.093994140625, 2.1939697265625, 2.2939453125, 2.3939208984375, 2.493896484375, 2.5938720703125, 2.69384765625, 2.7938232421875, 2.893798828125, 2.9937744140625, 3.09375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 2.0, 9.0, 10.0, 14.0, 23.0, 44.0, 49.0, 101.0, 185.0, 326.0, 634.0, 1173.0, 2262.0, 4225.0, 8605.0, 17410.0, 37750.0, 88782.0, 292159.0, 1451944.0, 106557.0, 44383.0, 20186.0, 9904.0, 4917.0, 2568.0, 1330.0, 683.0, 382.0, 210.0, 116.0, 59.0, 39.0, 27.0, 11.0, 12.0, 12.0, 6.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5146484375, -1.4659423828125, -1.417236328125, -1.3685302734375, -1.31982421875, -1.2711181640625, -1.222412109375, -1.1737060546875, -1.125, -1.0762939453125, -1.027587890625, -0.9788818359375, -0.93017578125, -0.8814697265625, -0.832763671875, -0.7840576171875, -0.7353515625, -0.6866455078125, -0.637939453125, -0.5892333984375, -0.54052734375, -0.4918212890625, -0.443115234375, -0.3944091796875, -0.345703125, -0.2969970703125, -0.248291015625, -0.1995849609375, -0.15087890625, -0.1021728515625, -0.053466796875, -0.0047607421875, 0.0439453125, 0.0926513671875, 0.141357421875, 0.1900634765625, 0.23876953125, 0.2874755859375, 0.336181640625, 0.3848876953125, 0.43359375, 0.4822998046875, 0.531005859375, 0.5797119140625, 0.62841796875, 0.6771240234375, 0.725830078125, 0.7745361328125, 0.8232421875, 0.8719482421875, 0.920654296875, 0.9693603515625, 1.01806640625, 1.0667724609375, 1.115478515625, 1.1641845703125, 1.212890625, 1.2615966796875, 1.310302734375, 1.3590087890625, 1.40771484375, 1.4564208984375, 1.505126953125, 1.5538330078125, 1.6025390625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 0.0, 4.0, 9.0, 10.0, 10.0, 8.0, 9.0, 7.0, 7.0, 12.0, 13.0, 19.0, 23.0, 25.0, 25.0, 35.0, 63.0, 37.0, 56.0, 54.0, 67.0, 70.0, 72.0, 61.0, 51.0, 47.0, 40.0, 21.0, 27.0, 23.0, 14.0, 14.0, 14.0, 7.0, 7.0, 11.0, 4.0, 3.0, 4.0, 5.0, 1.0, 5.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007233619689941406, -0.0006991773843765259, -0.0006749927997589111, -0.0006508082151412964, -0.0006266236305236816, -0.0006024390459060669, -0.0005782544612884521, -0.0005540698766708374, -0.0005298852920532227, -0.0005057007074356079, -0.00048151612281799316, -0.0004573315382003784, -0.00043314695358276367, -0.0004089623689651489, -0.0003847777843475342, -0.00036059319972991943, -0.0003364086151123047, -0.00031222403049468994, -0.0002880394458770752, -0.00026385486125946045, -0.0002396702766418457, -0.00021548569202423096, -0.0001913011074066162, -0.00016711652278900146, -0.00014293193817138672, -0.00011874735355377197, -9.456276893615723e-05, -7.037818431854248e-05, -4.6193599700927734e-05, -2.2009015083312988e-05, 2.175569534301758e-06, 2.6360154151916504e-05, 5.054473876953125e-05, 7.4729323387146e-05, 9.891390800476074e-05, 0.0001230984926223755, 0.00014728307723999023, 0.00017146766185760498, 0.00019565224647521973, 0.00021983683109283447, 0.00024402141571044922, 0.00026820600032806396, 0.0002923905849456787, 0.00031657516956329346, 0.0003407597541809082, 0.00036494433879852295, 0.0003891289234161377, 0.00041331350803375244, 0.0004374980926513672, 0.00046168267726898193, 0.0004858672618865967, 0.0005100518465042114, 0.0005342364311218262, 0.0005584210157394409, 0.0005826056003570557, 0.0006067901849746704, 0.0006309747695922852, 0.0006551593542098999, 0.0006793439388275146, 0.0007035285234451294, 0.0007277131080627441, 0.0007518976926803589, 0.0007760822772979736, 0.0008002668619155884, 0.0008244514465332031]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 2.0, 6.0, 5.0, 8.0, 11.0, 13.0, 12.0, 29.0, 26.0, 51.0, 47.0, 87.0, 84.0, 133.0, 161.0, 308.0, 639.0, 13510.0, 1030109.0, 1975.0, 485.0, 249.0, 137.0, 97.0, 70.0, 77.0, 36.0, 43.0, 23.0, 23.0, 19.0, 17.0, 18.0, 8.0, 5.0, 4.0, 13.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0187530517578125, -0.01820683479309082, -0.01766061782836914, -0.01711440086364746, -0.01656818389892578, -0.0160219669342041, -0.015475749969482422, -0.014929533004760742, -0.014383316040039062, -0.013837099075317383, -0.013290882110595703, -0.012744665145874023, -0.012198448181152344, -0.011652231216430664, -0.011106014251708984, -0.010559797286987305, -0.010013580322265625, -0.009467363357543945, -0.008921146392822266, -0.008374929428100586, -0.007828712463378906, -0.0072824954986572266, -0.006736278533935547, -0.006190061569213867, -0.0056438446044921875, -0.005097627639770508, -0.004551410675048828, -0.0040051937103271484, -0.0034589767456054688, -0.002912759780883789, -0.0023665428161621094, -0.0018203258514404297, -0.00127410888671875, -0.0007278919219970703, -0.00018167495727539062, 0.00036454200744628906, 0.0009107589721679688, 0.0014569759368896484, 0.002003192901611328, 0.002549409866333008, 0.0030956268310546875, 0.003641843795776367, 0.004188060760498047, 0.0047342777252197266, 0.005280494689941406, 0.005826711654663086, 0.006372928619384766, 0.006919145584106445, 0.007465362548828125, 0.008011579513549805, 0.008557796478271484, 0.009104013442993164, 0.009650230407714844, 0.010196447372436523, 0.010742664337158203, 0.011288881301879883, 0.011835098266601562, 0.012381315231323242, 0.012927532196044922, 0.013473749160766602, 0.014019966125488281, 0.014566183090209961, 0.01511240005493164, 0.01565861701965332, 0.016204833984375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 32.0, 375.0, 539.0, 61.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008177493000403047, -0.0007504896493628621, -0.0006832299986854196, -0.0006159702898003161, -0.0005487106391228735, -0.000481450988445431, -0.000414191308664158, -0.000346931628882885, -0.00027967197820544243, -0.00021241231297608465, -0.00014515264774672687, -7.789298251736909e-05, -1.0633317288011312e-05, 5.662633338943124e-05, 0.00012388601317070425, 0.00019114569295197725, 0.0002584053436294198, 0.00032566499430686235, 0.00039292467408813536, 0.00046018435386940837, 0.0005274440045468509, 0.0005947036552242935, 0.0006619633641093969, 0.0007292230147868395, 0.000796482665464282, 0.0008637423161417246, 0.0009310019668191671, 0.0009982616174966097, 0.0010655212681740522, 0.0011327809188514948, 0.0012000406859442592, 0.0012673003366217017, 0.001334560103714466, 0.0014018197543919086, 0.0014690794050693512, 0.0015363390557467937, 0.0016035987064242363, 0.0016708583571016788, 0.0017381181241944432, 0.0018053777748718858, 0.0018726374255493283, 0.0019398970762267709, 0.0020071568433195353, 0.002074416493996978, 0.0021416761446744204, 0.002208935795351863, 0.0022761954460293055, 0.002343455096706748, 0.0024107147473841906, 0.002477974398061633, 0.0025452340487390757, 0.002612493699416518, 0.0026797533500939608, 0.0027470130007714033, 0.002814272651448846, 0.002881532534956932, 0.0029487921856343746, 0.003016051836311817, 0.0030833114869892597, 0.0031505711376667023, 0.003217830788344145, 0.0032850904390215874, 0.00335235008969903, 0.0034196097403764725, 0.003486869391053915]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 7.0, 7.0, 8.0, 6.0, 10.0, 11.0, 17.0, 17.0, 19.0, 15.0, 26.0, 20.0, 23.0, 24.0, 24.0, 23.0, 39.0, 37.0, 37.0, 34.0, 38.0, 38.0, 40.0, 47.0, 42.0, 41.0, 38.0, 37.0, 37.0, 17.0, 28.0, 26.0, 22.0, 19.0, 16.0, 20.0, 19.0, 13.0, 10.0, 6.0, 4.0, 3.0, 6.0, 5.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0], "bins": [-0.0004006624221801758, -0.0003885813057422638, -0.0003765001893043518, -0.0003644190728664398, -0.00035233795642852783, -0.00034025683999061584, -0.00032817572355270386, -0.00031609460711479187, -0.0003040134906768799, -0.0002919323742389679, -0.0002798512578010559, -0.0002677701413631439, -0.00025568902492523193, -0.00024360790848731995, -0.00023152679204940796, -0.00021944567561149597, -0.00020736455917358398, -0.000195283442735672, -0.00018320232629776, -0.00017112120985984802, -0.00015904009342193604, -0.00014695897698402405, -0.00013487786054611206, -0.00012279674410820007, -0.00011071562767028809, -9.86345112323761e-05, -8.655339479446411e-05, -7.447227835655212e-05, -6.239116191864014e-05, -5.031004548072815e-05, -3.822892904281616e-05, -2.6147812604904175e-05, -1.4066696166992188e-05, -1.9855797290802e-06, 1.0095536708831787e-05, 2.2176653146743774e-05, 3.425776958465576e-05, 4.633888602256775e-05, 5.8420002460479736e-05, 7.050111889839172e-05, 8.258223533630371e-05, 9.46633517742157e-05, 0.00010674446821212769, 0.00011882558465003967, 0.00013090670108795166, 0.00014298781752586365, 0.00015506893396377563, 0.00016715005040168762, 0.0001792311668395996, 0.0001913122832775116, 0.00020339339971542358, 0.00021547451615333557, 0.00022755563259124756, 0.00023963674902915955, 0.00025171786546707153, 0.0002637989819049835, 0.0002758800983428955, 0.0002879612147808075, 0.0003000423312187195, 0.00031212344765663147, 0.00032420456409454346, 0.00033628568053245544, 0.00034836679697036743, 0.0003604479134082794, 0.0003725290298461914]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 4.0, 8.0, 6.0, 9.0, 11.0, 6.0, 13.0, 14.0, 21.0, 23.0, 24.0, 32.0, 29.0, 35.0, 27.0, 24.0, 35.0, 37.0, 41.0, 41.0, 44.0, 47.0, 35.0, 37.0, 46.0, 48.0, 23.0, 33.0, 27.0, 28.0, 24.0, 29.0, 22.0, 21.0, 22.0, 21.0, 12.0, 12.0, 9.0, 7.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.888671875, -3.750762939453125, -3.61285400390625, -3.474945068359375, -3.3370361328125, -3.199127197265625, -3.06121826171875, -2.923309326171875, -2.785400390625, -2.647491455078125, -2.50958251953125, -2.371673583984375, -2.2337646484375, -2.095855712890625, -1.95794677734375, -1.820037841796875, -1.68212890625, -1.544219970703125, -1.40631103515625, -1.268402099609375, -1.1304931640625, -0.992584228515625, -0.85467529296875, -0.716766357421875, -0.578857421875, -0.440948486328125, -0.30303955078125, -0.165130615234375, -0.0272216796875, 0.110687255859375, 0.24859619140625, 0.386505126953125, 0.5244140625, 0.662322998046875, 0.80023193359375, 0.938140869140625, 1.0760498046875, 1.213958740234375, 1.35186767578125, 1.489776611328125, 1.627685546875, 1.765594482421875, 1.90350341796875, 2.041412353515625, 2.1793212890625, 2.317230224609375, 2.45513916015625, 2.593048095703125, 2.73095703125, 2.868865966796875, 3.00677490234375, 3.144683837890625, 3.2825927734375, 3.420501708984375, 3.55841064453125, 3.696319580078125, 3.834228515625, 3.972137451171875, 4.11004638671875, 4.247955322265625, 4.3858642578125, 4.523773193359375, 4.66168212890625, 4.799591064453125, 4.9375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 4.0, 9.0, 13.0, 14.0, 30.0, 33.0, 57.0, 83.0, 138.0, 251.0, 448.0, 785.0, 1515.0, 3276.0, 8523.0, 27940.0, 150028.0, 650259.0, 160477.0, 28962.0, 8819.0, 3466.0, 1600.0, 769.0, 399.0, 265.0, 164.0, 81.0, 59.0, 34.0, 18.0, 14.0, 11.0, 4.0, 4.0, 6.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6875, -4.5286865234375, -4.369873046875, -4.2110595703125, -4.05224609375, -3.8934326171875, -3.734619140625, -3.5758056640625, -3.4169921875, -3.2581787109375, -3.099365234375, -2.9405517578125, -2.78173828125, -2.6229248046875, -2.464111328125, -2.3052978515625, -2.146484375, -1.9876708984375, -1.828857421875, -1.6700439453125, -1.51123046875, -1.3524169921875, -1.193603515625, -1.0347900390625, -0.8759765625, -0.7171630859375, -0.558349609375, -0.3995361328125, -0.24072265625, -0.0819091796875, 0.076904296875, 0.2357177734375, 0.39453125, 0.5533447265625, 0.712158203125, 0.8709716796875, 1.02978515625, 1.1885986328125, 1.347412109375, 1.5062255859375, 1.6650390625, 1.8238525390625, 1.982666015625, 2.1414794921875, 2.30029296875, 2.4591064453125, 2.617919921875, 2.7767333984375, 2.935546875, 3.0943603515625, 3.253173828125, 3.4119873046875, 3.57080078125, 3.7296142578125, 3.888427734375, 4.0472412109375, 4.2060546875, 4.3648681640625, 4.523681640625, 4.6824951171875, 4.84130859375, 5.0001220703125, 5.158935546875, 5.3177490234375, 5.4765625]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 4.0, 7.0, 10.0, 8.0, 10.0, 13.0, 17.0, 25.0, 26.0, 23.0, 29.0, 32.0, 27.0, 38.0, 45.0, 57.0, 61.0, 84.0, 1721.0, 349.0, 54.0, 47.0, 32.0, 31.0, 36.0, 31.0, 35.0, 40.0, 27.0, 29.0, 15.0, 11.0, 14.0, 10.0, 12.0, 11.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-16.546875, -16.0426025390625, -15.538330078125, -15.0340576171875, -14.52978515625, -14.0255126953125, -13.521240234375, -13.0169677734375, -12.5126953125, -12.0084228515625, -11.504150390625, -10.9998779296875, -10.49560546875, -9.9913330078125, -9.487060546875, -8.9827880859375, -8.478515625, -7.9742431640625, -7.469970703125, -6.9656982421875, -6.46142578125, -5.9571533203125, -5.452880859375, -4.9486083984375, -4.4443359375, -3.9400634765625, -3.435791015625, -2.9315185546875, -2.42724609375, -1.9229736328125, -1.418701171875, -0.9144287109375, -0.41015625, 0.0941162109375, 0.598388671875, 1.1026611328125, 1.60693359375, 2.1112060546875, 2.615478515625, 3.1197509765625, 3.6240234375, 4.1282958984375, 4.632568359375, 5.1368408203125, 5.64111328125, 6.1453857421875, 6.649658203125, 7.1539306640625, 7.658203125, 8.1624755859375, 8.666748046875, 9.1710205078125, 9.67529296875, 10.1795654296875, 10.683837890625, 11.1881103515625, 11.6923828125, 12.1966552734375, 12.700927734375, 13.2052001953125, 13.70947265625, 14.2137451171875, 14.718017578125, 15.2222900390625, 15.7265625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 11.0, 11.0, 10.0, 14.0, 23.0, 13.0, 29.0, 45.0, 43.0, 46.0, 61.0, 98.0, 140.0, 260.0, 522.0, 1769.0, 76174.0, 3057087.0, 7466.0, 817.0, 379.0, 212.0, 118.0, 68.0, 53.0, 44.0, 38.0, 25.0, 24.0, 20.0, 20.0, 6.0, 10.0, 8.0, 9.0, 6.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.984375, -25.1533203125, -24.322265625, -23.4912109375, -22.66015625, -21.8291015625, -20.998046875, -20.1669921875, -19.3359375, -18.5048828125, -17.673828125, -16.8427734375, -16.01171875, -15.1806640625, -14.349609375, -13.5185546875, -12.6875, -11.8564453125, -11.025390625, -10.1943359375, -9.36328125, -8.5322265625, -7.701171875, -6.8701171875, -6.0390625, -5.2080078125, -4.376953125, -3.5458984375, -2.71484375, -1.8837890625, -1.052734375, -0.2216796875, 0.609375, 1.4404296875, 2.271484375, 3.1025390625, 3.93359375, 4.7646484375, 5.595703125, 6.4267578125, 7.2578125, 8.0888671875, 8.919921875, 9.7509765625, 10.58203125, 11.4130859375, 12.244140625, 13.0751953125, 13.90625, 14.7373046875, 15.568359375, 16.3994140625, 17.23046875, 18.0615234375, 18.892578125, 19.7236328125, 20.5546875, 21.3857421875, 22.216796875, 23.0478515625, 23.87890625, 24.7099609375, 25.541015625, 26.3720703125, 27.203125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 26.0, 72.0, 150.0, 229.0, 226.0, 162.0, 87.0, 32.0, 15.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.63768768310547, -25.990318298339844, -25.34294891357422, -24.69557762145996, -24.048208236694336, -23.40083885192871, -22.753469467163086, -22.10610008239746, -21.458728790283203, -20.811359405517578, -20.163990020751953, -19.516618728637695, -18.86924934387207, -18.221879959106445, -17.57451057434082, -16.927141189575195, -16.27977180480957, -15.632402420043945, -14.985032081604004, -14.337662696838379, -13.690292358398438, -13.042922973632812, -12.395553588867188, -11.748184204101562, -11.100813865661621, -10.453444480895996, -9.806074142456055, -9.15870475769043, -8.511335372924805, -7.863965034484863, -7.216595649719238, -6.569225788116455, -5.921857833862305, -5.2744879722595215, -4.627118110656738, -3.9797487258911133, -3.33237886428833, -2.685009002685547, -2.0376393795013428, -1.3902697563171387, -0.7428998947143555, -0.09553015232086182, 0.5518395900726318, 1.1992093324661255, 1.8465790748596191, 2.4939489364624023, 3.1413185596466064, 3.7886881828308105, 4.436058044433594, 5.083427906036377, 5.73079776763916, 6.378167152404785, 7.025537014007568, 7.672906875610352, 8.320276260375977, 8.967645645141602, 9.615015983581543, 10.262385368347168, 10.90975570678711, 11.557125091552734, 12.20449447631836, 12.8518648147583, 13.499234199523926, 14.146604537963867, 14.793973922729492]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 8.0, 5.0, 2.0, 8.0, 8.0, 9.0, 11.0, 14.0, 11.0, 15.0, 23.0, 23.0, 9.0, 25.0, 31.0, 33.0, 31.0, 36.0, 35.0, 32.0, 36.0, 34.0, 45.0, 45.0, 37.0, 42.0, 33.0, 40.0, 34.0, 28.0, 37.0, 30.0, 24.0, 32.0, 22.0, 28.0, 22.0, 17.0, 12.0, 6.0, 11.0, 8.0, 3.0, 3.0, 3.0, 1.0, 2.0, 7.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.205177307128906, -48.695552825927734, -47.18592834472656, -45.67630386352539, -44.16667938232422, -42.65705490112305, -41.147430419921875, -39.63780975341797, -38.12818145751953, -36.61855697631836, -35.10893249511719, -33.599308013916016, -32.089683532714844, -30.580059051513672, -29.070436477661133, -27.56081199645996, -26.051189422607422, -24.54156494140625, -23.031940460205078, -21.522315979003906, -20.012691497802734, -18.503067016601562, -16.993444442749023, -15.483819961547852, -13.97419548034668, -12.464570999145508, -10.954946517944336, -9.44532299041748, -7.935698509216309, -6.426074028015137, -4.916450500488281, -3.4068260192871094, -1.8972015380859375, -0.3875772953033447, 1.122046947479248, 2.6316709518432617, 4.141295433044434, 5.6509199142456055, 7.160543441772461, 8.670167922973633, 10.179792404174805, 11.689416885375977, 13.199041366577148, 14.708664894104004, 16.21828842163086, 17.72791290283203, 19.237537384033203, 20.747161865234375, 22.256786346435547, 23.76641082763672, 25.27603530883789, 26.785659790039062, 28.295284271240234, 29.804908752441406, 31.314531326293945, 32.82415771484375, 34.333778381347656, 35.84340286254883, 37.35302734375, 38.86265182495117, 40.372276306152344, 41.881900787353516, 43.39152526855469, 44.901145935058594, 46.41077423095703]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 0.0, 1.0, 10.0, 8.0, 7.0, 14.0, 2.0, 14.0, 13.0, 21.0, 18.0, 26.0, 32.0, 26.0, 40.0, 29.0, 25.0, 36.0, 34.0, 41.0, 38.0, 46.0, 49.0, 41.0, 35.0, 44.0, 42.0, 27.0, 35.0, 28.0, 32.0, 26.0, 24.0, 23.0, 28.0, 17.0, 19.0, 12.0, 12.0, 9.0, 5.0, 4.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0390625, -3.896484375, -3.75390625, -3.611328125, -3.46875, -3.326171875, -3.18359375, -3.041015625, -2.8984375, -2.755859375, -2.61328125, -2.470703125, -2.328125, -2.185546875, -2.04296875, -1.900390625, -1.7578125, -1.615234375, -1.47265625, -1.330078125, -1.1875, -1.044921875, -0.90234375, -0.759765625, -0.6171875, -0.474609375, -0.33203125, -0.189453125, -0.046875, 0.095703125, 0.23828125, 0.380859375, 0.5234375, 0.666015625, 0.80859375, 0.951171875, 1.09375, 1.236328125, 1.37890625, 1.521484375, 1.6640625, 1.806640625, 1.94921875, 2.091796875, 2.234375, 2.376953125, 2.51953125, 2.662109375, 2.8046875, 2.947265625, 3.08984375, 3.232421875, 3.375, 3.517578125, 3.66015625, 3.802734375, 3.9453125, 4.087890625, 4.23046875, 4.373046875, 4.515625, 4.658203125, 4.80078125, 4.943359375, 5.0859375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 4.0, 5.0, 15.0, 10.0, 19.0, 19.0, 28.0, 25.0, 50.0, 64.0, 116.0, 224.0, 492.0, 1405.0, 6376.0, 46117.0, 730513.0, 2864752.0, 502710.0, 34241.0, 4940.0, 1185.0, 432.0, 203.0, 110.0, 56.0, 46.0, 30.0, 27.0, 19.0, 12.0, 11.0, 9.0, 7.0, 3.0, 2.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.390625, -9.99755859375, -9.6044921875, -9.21142578125, -8.818359375, -8.42529296875, -8.0322265625, -7.63916015625, -7.24609375, -6.85302734375, -6.4599609375, -6.06689453125, -5.673828125, -5.28076171875, -4.8876953125, -4.49462890625, -4.1015625, -3.70849609375, -3.3154296875, -2.92236328125, -2.529296875, -2.13623046875, -1.7431640625, -1.35009765625, -0.95703125, -0.56396484375, -0.1708984375, 0.22216796875, 0.615234375, 1.00830078125, 1.4013671875, 1.79443359375, 2.1875, 2.58056640625, 2.9736328125, 3.36669921875, 3.759765625, 4.15283203125, 4.5458984375, 4.93896484375, 5.33203125, 5.72509765625, 6.1181640625, 6.51123046875, 6.904296875, 7.29736328125, 7.6904296875, 8.08349609375, 8.4765625, 8.86962890625, 9.2626953125, 9.65576171875, 10.048828125, 10.44189453125, 10.8349609375, 11.22802734375, 11.62109375, 12.01416015625, 12.4072265625, 12.80029296875, 13.193359375, 13.58642578125, 13.9794921875, 14.37255859375, 14.765625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 5.0, 12.0, 4.0, 12.0, 21.0, 23.0, 37.0, 43.0, 59.0, 119.0, 143.0, 208.0, 312.0, 418.0, 529.0, 557.0, 441.0, 340.0, 248.0, 156.0, 115.0, 107.0, 42.0, 40.0, 34.0, 16.0, 10.0, 7.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1640625, -11.6800537109375, -11.196044921875, -10.7120361328125, -10.22802734375, -9.7440185546875, -9.260009765625, -8.7760009765625, -8.2919921875, -7.8079833984375, -7.323974609375, -6.8399658203125, -6.35595703125, -5.8719482421875, -5.387939453125, -4.9039306640625, -4.419921875, -3.9359130859375, -3.451904296875, -2.9678955078125, -2.48388671875, -1.9998779296875, -1.515869140625, -1.0318603515625, -0.5478515625, -0.0638427734375, 0.420166015625, 0.9041748046875, 1.38818359375, 1.8721923828125, 2.356201171875, 2.8402099609375, 3.32421875, 3.8082275390625, 4.292236328125, 4.7762451171875, 5.26025390625, 5.7442626953125, 6.228271484375, 6.7122802734375, 7.1962890625, 7.6802978515625, 8.164306640625, 8.6483154296875, 9.13232421875, 9.6163330078125, 10.100341796875, 10.5843505859375, 11.068359375, 11.5523681640625, 12.036376953125, 12.5203857421875, 13.00439453125, 13.4884033203125, 13.972412109375, 14.4564208984375, 14.9404296875, 15.4244384765625, 15.908447265625, 16.3924560546875, 16.87646484375, 17.3604736328125, 17.844482421875, 18.3284912109375, 18.8125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 1.0, 8.0, 14.0, 23.0, 32.0, 65.0, 84.0, 174.0, 251.0, 606.0, 17272.0, 4159216.0, 15335.0, 585.0, 255.0, 132.0, 87.0, 57.0, 30.0, 18.0, 15.0, 11.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.75, -89.08984375, -86.4296875, -83.76953125, -81.109375, -78.44921875, -75.7890625, -73.12890625, -70.46875, -67.80859375, -65.1484375, -62.48828125, -59.828125, -57.16796875, -54.5078125, -51.84765625, -49.1875, -46.52734375, -43.8671875, -41.20703125, -38.546875, -35.88671875, -33.2265625, -30.56640625, -27.90625, -25.24609375, -22.5859375, -19.92578125, -17.265625, -14.60546875, -11.9453125, -9.28515625, -6.625, -3.96484375, -1.3046875, 1.35546875, 4.015625, 6.67578125, 9.3359375, 11.99609375, 14.65625, 17.31640625, 19.9765625, 22.63671875, 25.296875, 27.95703125, 30.6171875, 33.27734375, 35.9375, 38.59765625, 41.2578125, 43.91796875, 46.578125, 49.23828125, 51.8984375, 54.55859375, 57.21875, 59.87890625, 62.5390625, 65.19921875, 67.859375, 70.51953125, 73.1796875, 75.83984375, 78.5]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 6.0, 21.0, 52.0, 103.0, 156.0, 237.0, 174.0, 143.0, 67.0, 24.0, 18.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.07289505004883, -52.53841018676758, -50.00392150878906, -47.46943664550781, -44.93495178222656, -42.40046310424805, -39.8659782409668, -37.33148956298828, -34.79700469970703, -32.26251983642578, -29.728031158447266, -27.193546295166016, -24.659059524536133, -22.12457275390625, -19.590087890625, -17.055601119995117, -14.521114349365234, -11.986627578735352, -9.452141761779785, -6.9176554679870605, -4.383169174194336, -1.8486824035644531, 0.6858034133911133, 3.2202892303466797, 5.7547760009765625, 8.289262771606445, 10.823748588562012, 13.358234405517578, 15.892721176147461, 18.427207946777344, 20.961692810058594, 23.496179580688477, 26.030662536621094, 28.565149307250977, 31.09963607788086, 33.63412094116211, 36.168609619140625, 38.703094482421875, 41.237579345703125, 43.772064208984375, 46.30655288696289, 48.84103775024414, 51.375526428222656, 53.910011291503906, 56.444496154785156, 58.97898483276367, 61.51346969604492, 64.04795837402344, 66.58244323730469, 69.11692810058594, 71.65141296386719, 74.18590545654297, 76.72039031982422, 79.25487518310547, 81.78936004638672, 84.32384490966797, 86.85833740234375, 89.392822265625, 91.92730712890625, 94.46179962158203, 96.99628448486328, 99.53076934814453, 102.06525421142578, 104.59973907470703, 107.13422393798828]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 9.0, 7.0, 10.0, 12.0, 14.0, 20.0, 15.0, 16.0, 27.0, 31.0, 27.0, 32.0, 25.0, 31.0, 51.0, 39.0, 53.0, 46.0, 51.0, 42.0, 38.0, 37.0, 45.0, 54.0, 37.0, 34.0, 23.0, 25.0, 32.0, 24.0, 16.0, 16.0, 20.0, 12.0, 11.0, 7.0, 3.0, 5.0, 1.0, 5.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.55772399902344, -46.00416564941406, -44.45061111450195, -42.89705276489258, -41.3434944152832, -39.789939880371094, -38.23638153076172, -36.682823181152344, -35.12926483154297, -33.575706481933594, -32.022151947021484, -30.46859359741211, -28.915035247802734, -27.361478805541992, -25.80792236328125, -24.254364013671875, -22.700809478759766, -21.147253036499023, -19.59369468688965, -18.040138244628906, -16.48657989501953, -14.933023452758789, -13.379467010498047, -11.825909614562988, -10.27235221862793, -8.718794822692871, -7.165237903594971, -5.61168098449707, -4.058123588562012, -2.504566192626953, -0.9510097503662109, 0.6025476455688477, 2.1561050415039062, 3.7096621990203857, 5.263219356536865, 6.816776275634766, 8.370333671569824, 9.923891067504883, 11.477447509765625, 13.031004905700684, 14.584562301635742, 16.138118743896484, 17.69167709350586, 19.2452335357666, 20.798789978027344, 22.35234832763672, 23.90590476989746, 25.459461212158203, 27.013019561767578, 28.56657600402832, 30.120134353637695, 31.673690795898438, 33.22724914550781, 34.78080749511719, 36.3343620300293, 37.88792037963867, 39.44147491455078, 40.995033264160156, 42.548587799072266, 44.10214614868164, 45.655704498291016, 47.209259033203125, 48.7628173828125, 50.316375732421875, 51.86993408203125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 5.0, 3.0, 4.0, 7.0, 9.0, 13.0, 10.0, 18.0, 12.0, 12.0, 15.0, 25.0, 20.0, 25.0, 31.0, 26.0, 26.0, 34.0, 36.0, 33.0, 32.0, 47.0, 31.0, 38.0, 39.0, 36.0, 30.0, 37.0, 25.0, 36.0, 28.0, 26.0, 21.0, 26.0, 21.0, 32.0, 20.0, 17.0, 15.0, 25.0, 8.0, 13.0, 9.0, 6.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.93359375, -3.80511474609375, -3.6766357421875, -3.54815673828125, -3.419677734375, -3.29119873046875, -3.1627197265625, -3.03424072265625, -2.90576171875, -2.77728271484375, -2.6488037109375, -2.52032470703125, -2.391845703125, -2.26336669921875, -2.1348876953125, -2.00640869140625, -1.8779296875, -1.74945068359375, -1.6209716796875, -1.49249267578125, -1.364013671875, -1.23553466796875, -1.1070556640625, -0.97857666015625, -0.85009765625, -0.72161865234375, -0.5931396484375, -0.46466064453125, -0.336181640625, -0.20770263671875, -0.0792236328125, 0.04925537109375, 0.177734375, 0.30621337890625, 0.4346923828125, 0.56317138671875, 0.691650390625, 0.82012939453125, 0.9486083984375, 1.07708740234375, 1.20556640625, 1.33404541015625, 1.4625244140625, 1.59100341796875, 1.719482421875, 1.84796142578125, 1.9764404296875, 2.10491943359375, 2.2333984375, 2.36187744140625, 2.4903564453125, 2.61883544921875, 2.747314453125, 2.87579345703125, 3.0042724609375, 3.13275146484375, 3.26123046875, 3.38970947265625, 3.5181884765625, 3.64666748046875, 3.775146484375, 3.90362548828125, 4.0321044921875, 4.16058349609375, 4.2890625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 5.0, 9.0, 12.0, 18.0, 23.0, 29.0, 64.0, 102.0, 120.0, 211.0, 302.0, 448.0, 657.0, 962.0, 1386.0, 2140.0, 2952.0, 4422.0, 6171.0, 9108.0, 13294.0, 19470.0, 29745.0, 45700.0, 74071.0, 135202.0, 285091.0, 172679.0, 87692.0, 52816.0, 33662.0, 22571.0, 14906.0, 10270.0, 6865.0, 4760.0, 3330.0, 2232.0, 1590.0, 1109.0, 739.0, 514.0, 366.0, 237.0, 180.0, 111.0, 77.0, 48.0, 38.0, 27.0, 13.0, 6.0, 5.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7900390625, -0.7642669677734375, -0.738494873046875, -0.7127227783203125, -0.68695068359375, -0.6611785888671875, -0.635406494140625, -0.6096343994140625, -0.5838623046875, -0.5580902099609375, -0.532318115234375, -0.5065460205078125, -0.48077392578125, -0.4550018310546875, -0.429229736328125, -0.4034576416015625, -0.377685546875, -0.3519134521484375, -0.326141357421875, -0.3003692626953125, -0.27459716796875, -0.2488250732421875, -0.223052978515625, -0.1972808837890625, -0.1715087890625, -0.1457366943359375, -0.119964599609375, -0.0941925048828125, -0.06842041015625, -0.0426483154296875, -0.016876220703125, 0.0088958740234375, 0.03466796875, 0.0604400634765625, 0.086212158203125, 0.1119842529296875, 0.13775634765625, 0.1635284423828125, 0.189300537109375, 0.2150726318359375, 0.2408447265625, 0.2666168212890625, 0.292388916015625, 0.3181610107421875, 0.34393310546875, 0.3697052001953125, 0.395477294921875, 0.4212493896484375, 0.447021484375, 0.4727935791015625, 0.498565673828125, 0.5243377685546875, 0.55010986328125, 0.5758819580078125, 0.601654052734375, 0.6274261474609375, 0.6531982421875, 0.6789703369140625, 0.704742431640625, 0.7305145263671875, 0.75628662109375, 0.7820587158203125, 0.807830810546875, 0.8336029052734375, 0.859375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 1.0, 10.0, 4.0, 19.0, 14.0, 19.0, 21.0, 22.0, 24.0, 35.0, 34.0, 30.0, 43.0, 36.0, 44.0, 57.0, 40.0, 43.0, 1075.0, 36.0, 41.0, 54.0, 33.0, 35.0, 36.0, 30.0, 28.0, 30.0, 18.0, 20.0, 27.0, 18.0, 12.0, 10.0, 7.0, 5.0, 8.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.513671875, -2.410491943359375, -2.30731201171875, -2.204132080078125, -2.1009521484375, -1.997772216796875, -1.89459228515625, -1.791412353515625, -1.688232421875, -1.585052490234375, -1.48187255859375, -1.378692626953125, -1.2755126953125, -1.172332763671875, -1.06915283203125, -0.965972900390625, -0.86279296875, -0.759613037109375, -0.65643310546875, -0.553253173828125, -0.4500732421875, -0.346893310546875, -0.24371337890625, -0.140533447265625, -0.037353515625, 0.065826416015625, 0.16900634765625, 0.272186279296875, 0.3753662109375, 0.478546142578125, 0.58172607421875, 0.684906005859375, 0.7880859375, 0.891265869140625, 0.99444580078125, 1.097625732421875, 1.2008056640625, 1.303985595703125, 1.40716552734375, 1.510345458984375, 1.613525390625, 1.716705322265625, 1.81988525390625, 1.923065185546875, 2.0262451171875, 2.129425048828125, 2.23260498046875, 2.335784912109375, 2.43896484375, 2.542144775390625, 2.64532470703125, 2.748504638671875, 2.8516845703125, 2.954864501953125, 3.05804443359375, 3.161224365234375, 3.264404296875, 3.367584228515625, 3.47076416015625, 3.573944091796875, 3.6771240234375, 3.780303955078125, 3.88348388671875, 3.986663818359375, 4.08984375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 3.0, 9.0, 12.0, 12.0, 15.0, 33.0, 45.0, 69.0, 90.0, 191.0, 343.0, 656.0, 1361.0, 2927.0, 5937.0, 12901.0, 28348.0, 63633.0, 167742.0, 1524791.0, 170466.0, 64069.0, 28563.0, 12927.0, 6132.0, 2855.0, 1394.0, 709.0, 355.0, 203.0, 111.0, 83.0, 43.0, 27.0, 27.0, 16.0, 15.0, 5.0, 6.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.001953125, -1.9512786865234375, -1.900604248046875, -1.8499298095703125, -1.79925537109375, -1.7485809326171875, -1.697906494140625, -1.6472320556640625, -1.5965576171875, -1.5458831787109375, -1.495208740234375, -1.4445343017578125, -1.39385986328125, -1.3431854248046875, -1.292510986328125, -1.2418365478515625, -1.191162109375, -1.1404876708984375, -1.089813232421875, -1.0391387939453125, -0.98846435546875, -0.9377899169921875, -0.887115478515625, -0.8364410400390625, -0.7857666015625, -0.7350921630859375, -0.684417724609375, -0.6337432861328125, -0.58306884765625, -0.5323944091796875, -0.481719970703125, -0.4310455322265625, -0.38037109375, -0.3296966552734375, -0.279022216796875, -0.2283477783203125, -0.17767333984375, -0.1269989013671875, -0.076324462890625, -0.0256500244140625, 0.0250244140625, 0.0756988525390625, 0.126373291015625, 0.1770477294921875, 0.22772216796875, 0.2783966064453125, 0.329071044921875, 0.3797454833984375, 0.430419921875, 0.4810943603515625, 0.531768798828125, 0.5824432373046875, 0.63311767578125, 0.6837921142578125, 0.734466552734375, 0.7851409912109375, 0.8358154296875, 0.8864898681640625, 0.937164306640625, 0.9878387451171875, 1.03851318359375, 1.0891876220703125, 1.139862060546875, 1.1905364990234375, 1.2412109375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 6.0, 6.0, 5.0, 8.0, 9.0, 4.0, 12.0, 9.0, 12.0, 14.0, 17.0, 17.0, 16.0, 28.0, 35.0, 48.0, 49.0, 48.0, 65.0, 67.0, 64.0, 59.0, 56.0, 60.0, 53.0, 38.0, 30.0, 29.0, 21.0, 21.0, 7.0, 8.0, 18.0, 7.0, 9.0, 6.0, 9.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.0006456375122070312, -0.0006269291043281555, -0.0006082206964492798, -0.000589512288570404, -0.0005708038806915283, -0.0005520954728126526, -0.0005333870649337769, -0.0005146786570549011, -0.0004959702491760254, -0.00047726184129714966, -0.0004585534334182739, -0.0004398450255393982, -0.00042113661766052246, -0.00040242820978164673, -0.000383719801902771, -0.00036501139402389526, -0.00034630298614501953, -0.0003275945782661438, -0.00030888617038726807, -0.00029017776250839233, -0.0002714693546295166, -0.00025276094675064087, -0.00023405253887176514, -0.0002153441309928894, -0.00019663572311401367, -0.00017792731523513794, -0.0001592189073562622, -0.00014051049947738647, -0.00012180209159851074, -0.00010309368371963501, -8.438527584075928e-05, -6.567686796188354e-05, -4.696846008300781e-05, -2.826005220413208e-05, -9.551644325256348e-06, 9.156763553619385e-06, 2.7865171432495117e-05, 4.657357931137085e-05, 6.528198719024658e-05, 8.399039506912231e-05, 0.00010269880294799805, 0.00012140721082687378, 0.0001401156187057495, 0.00015882402658462524, 0.00017753243446350098, 0.0001962408423423767, 0.00021494925022125244, 0.00023365765810012817, 0.0002523660659790039, 0.00027107447385787964, 0.00028978288173675537, 0.0003084912896156311, 0.00032719969749450684, 0.00034590810537338257, 0.0003646165132522583, 0.00038332492113113403, 0.00040203332901000977, 0.0004207417368888855, 0.00043945014476776123, 0.00045815855264663696, 0.0004768669605255127, 0.0004955753684043884, 0.0005142837762832642, 0.0005329921841621399, 0.0005517005920410156]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 1.0, 10.0, 9.0, 7.0, 7.0, 13.0, 23.0, 22.0, 27.0, 41.0, 50.0, 94.0, 114.0, 159.0, 318.0, 732.0, 34941.0, 1008809.0, 1937.0, 470.0, 247.0, 134.0, 110.0, 75.0, 37.0, 23.0, 22.0, 19.0, 15.0, 13.0, 14.0, 12.0, 10.0, 6.0, 3.0, 2.0, 1.0, 4.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01361846923828125, -0.01315319538116455, -0.012687921524047852, -0.012222647666931152, -0.011757373809814453, -0.011292099952697754, -0.010826826095581055, -0.010361552238464355, -0.009896278381347656, -0.009431004524230957, -0.008965730667114258, -0.008500456809997559, -0.00803518295288086, -0.00756990909576416, -0.007104635238647461, -0.006639361381530762, -0.0061740875244140625, -0.005708813667297363, -0.005243539810180664, -0.004778265953063965, -0.004312992095947266, -0.0038477182388305664, -0.003382444381713867, -0.002917170524597168, -0.0024518966674804688, -0.0019866228103637695, -0.0015213489532470703, -0.001056075096130371, -0.0005908012390136719, -0.00012552738189697266, 0.00033974647521972656, 0.0008050203323364258, 0.001270294189453125, 0.0017355680465698242, 0.0022008419036865234, 0.0026661157608032227, 0.003131389617919922, 0.003596663475036621, 0.00406193733215332, 0.0045272111892700195, 0.004992485046386719, 0.005457758903503418, 0.005923032760620117, 0.006388306617736816, 0.006853580474853516, 0.007318854331970215, 0.007784128189086914, 0.008249402046203613, 0.008714675903320312, 0.009179949760437012, 0.009645223617553711, 0.01011049747467041, 0.01057577133178711, 0.011041045188903809, 0.011506319046020508, 0.011971592903137207, 0.012436866760253906, 0.012902140617370605, 0.013367414474487305, 0.013832688331604004, 0.014297962188720703, 0.014763236045837402, 0.015228509902954102, 0.0156937837600708, 0.0161590576171875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 11.0, 44.0, 138.0, 313.0, 335.0, 135.0, 29.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001122990157455206, -0.001087884302251041, -0.0010527785634621978, -0.0010176727082580328, -0.0009825669694691896, -0.0009474611142650247, -0.0009123553172685206, -0.0008772495202720165, -0.0008421437232755125, -0.0008070379262790084, -0.0007719321292825043, -0.0007368263322860003, -0.0007017204770818353, -0.0006666147382929921, -0.0006315088830888271, -0.0005964030860923231, -0.000561297289095819, -0.0005261914920993149, -0.0004910856951028109, -0.00045597986900247633, -0.00042087407200597227, -0.0003857682750094682, -0.00035066244890913367, -0.0003155566519126296, -0.00028045085491612554, -0.00024534505791962147, -0.00021023924637120217, -0.00017513343482278287, -0.0001400276378262788, -0.00010492184082977474, -6.981602928135544e-05, -3.4710217732936144e-05, 3.9569567888975143e-07, 3.5501499951351434e-05, 7.060730422381312e-05, 0.0001057131084962748, 0.00014081891276873648, 0.00017592470976524055, 0.00021103052131365985, 0.00024613633286207914, 0.0002812421298585832, 0.0003163479268550873, 0.00035145372385159135, 0.0003865595499519259, 0.00042166534694842994, 0.000456771143944934, 0.0004918769700452685, 0.0005269827670417726, 0.0005620885640382767, 0.0005971943610347807, 0.0006323001580312848, 0.0006674059550277889, 0.000702511752024293, 0.0007376176072284579, 0.000772723404224962, 0.0008078292012214661, 0.0008429349982179701, 0.0008780407952144742, 0.0009131465922109783, 0.0009482523892074823, 0.0009833582444116473, 0.0010184639832004905, 0.0010535698384046555, 0.0010886755771934986, 0.0011237814323976636]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 3.0, 5.0, 11.0, 10.0, 8.0, 13.0, 19.0, 17.0, 25.0, 31.0, 32.0, 26.0, 37.0, 38.0, 32.0, 40.0, 57.0, 41.0, 35.0, 33.0, 52.0, 40.0, 32.0, 32.0, 36.0, 38.0, 31.0, 26.0, 37.0, 15.0, 30.0, 19.0, 25.0, 14.0, 16.0, 14.0, 6.0, 6.0, 5.0, 3.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00038444995880126953, -0.000373070128262043, -0.00036169029772281647, -0.00035031046718358994, -0.0003389306366443634, -0.00032755080610513687, -0.00031617097556591034, -0.0003047911450266838, -0.0002934113144874573, -0.00028203148394823074, -0.0002706516534090042, -0.0002592718228697777, -0.00024789199233055115, -0.00023651216179132462, -0.00022513233125209808, -0.00021375250071287155, -0.00020237267017364502, -0.0001909928396344185, -0.00017961300909519196, -0.00016823317855596542, -0.0001568533480167389, -0.00014547351747751236, -0.00013409368693828583, -0.0001227138563990593, -0.00011133402585983276, -9.995419532060623e-05, -8.85743647813797e-05, -7.719453424215317e-05, -6.581470370292664e-05, -5.4434873163700104e-05, -4.305504262447357e-05, -3.167521208524704e-05, -2.0295381546020508e-05, -8.915551006793976e-06, 2.464279532432556e-06, 1.3844110071659088e-05, 2.522394061088562e-05, 3.660377115011215e-05, 4.7983601689338684e-05, 5.9363432228565216e-05, 7.074326276779175e-05, 8.212309330701828e-05, 9.350292384624481e-05, 0.00010488275438547134, 0.00011626258492469788, 0.0001276424154639244, 0.00013902224600315094, 0.00015040207654237747, 0.000161781907081604, 0.00017316173762083054, 0.00018454156816005707, 0.0001959213986992836, 0.00020730122923851013, 0.00021868105977773666, 0.0002300608903169632, 0.00024144072085618973, 0.00025282055139541626, 0.0002642003819346428, 0.0002755802124738693, 0.00028696004301309586, 0.0002983398735523224, 0.0003097197040915489, 0.00032109953463077545, 0.000332479365170002, 0.0003438591957092285]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 5.0, 3.0, 4.0, 7.0, 9.0, 13.0, 10.0, 18.0, 12.0, 12.0, 15.0, 25.0, 20.0, 25.0, 31.0, 26.0, 26.0, 34.0, 36.0, 33.0, 32.0, 47.0, 31.0, 38.0, 39.0, 36.0, 30.0, 37.0, 25.0, 35.0, 29.0, 26.0, 21.0, 26.0, 21.0, 32.0, 20.0, 17.0, 15.0, 25.0, 8.0, 13.0, 9.0, 6.0, 6.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.93359375, -3.80511474609375, -3.6766357421875, -3.54815673828125, -3.419677734375, -3.29119873046875, -3.1627197265625, -3.03424072265625, -2.90576171875, -2.77728271484375, -2.6488037109375, -2.52032470703125, -2.391845703125, -2.26336669921875, -2.1348876953125, -2.00640869140625, -1.8779296875, -1.74945068359375, -1.6209716796875, -1.49249267578125, -1.364013671875, -1.23553466796875, -1.1070556640625, -0.97857666015625, -0.85009765625, -0.72161865234375, -0.5931396484375, -0.46466064453125, -0.336181640625, -0.20770263671875, -0.0792236328125, 0.04925537109375, 0.177734375, 0.30621337890625, 0.4346923828125, 0.56317138671875, 0.691650390625, 0.82012939453125, 0.9486083984375, 1.07708740234375, 1.20556640625, 1.33404541015625, 1.4625244140625, 1.59100341796875, 1.719482421875, 1.84796142578125, 1.9764404296875, 2.10491943359375, 2.2333984375, 2.36187744140625, 2.4903564453125, 2.61883544921875, 2.747314453125, 2.87579345703125, 3.0042724609375, 3.13275146484375, 3.26123046875, 3.38970947265625, 3.5181884765625, 3.64666748046875, 3.775146484375, 3.90362548828125, 4.0321044921875, 4.16058349609375, 4.2890625]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 3.0, 7.0, 4.0, 9.0, 7.0, 15.0, 17.0, 17.0, 25.0, 28.0, 32.0, 59.0, 106.0, 152.0, 294.0, 538.0, 1014.0, 2127.0, 4454.0, 9842.0, 23409.0, 59554.0, 158245.0, 364121.0, 260605.0, 97764.0, 37838.0, 15158.0, 6676.0, 3047.0, 1566.0, 785.0, 404.0, 227.0, 127.0, 77.0, 52.0, 36.0, 24.0, 20.0, 15.0, 12.0, 10.0, 12.0, 7.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.513671875, -2.43194580078125, -2.3502197265625, -2.26849365234375, -2.186767578125, -2.10504150390625, -2.0233154296875, -1.94158935546875, -1.85986328125, -1.77813720703125, -1.6964111328125, -1.61468505859375, -1.532958984375, -1.45123291015625, -1.3695068359375, -1.28778076171875, -1.2060546875, -1.12432861328125, -1.0426025390625, -0.96087646484375, -0.879150390625, -0.79742431640625, -0.7156982421875, -0.63397216796875, -0.55224609375, -0.47052001953125, -0.3887939453125, -0.30706787109375, -0.225341796875, -0.14361572265625, -0.0618896484375, 0.01983642578125, 0.1015625, 0.18328857421875, 0.2650146484375, 0.34674072265625, 0.428466796875, 0.51019287109375, 0.5919189453125, 0.67364501953125, 0.75537109375, 0.83709716796875, 0.9188232421875, 1.00054931640625, 1.082275390625, 1.16400146484375, 1.2457275390625, 1.32745361328125, 1.4091796875, 1.49090576171875, 1.5726318359375, 1.65435791015625, 1.736083984375, 1.81781005859375, 1.8995361328125, 1.98126220703125, 2.06298828125, 2.14471435546875, 2.2264404296875, 2.30816650390625, 2.389892578125, 2.47161865234375, 2.5533447265625, 2.63507080078125, 2.716796875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 4.0, 1.0, 8.0, 7.0, 13.0, 7.0, 10.0, 10.0, 8.0, 12.0, 16.0, 28.0, 19.0, 27.0, 26.0, 30.0, 39.0, 39.0, 39.0, 47.0, 92.0, 268.0, 1700.0, 114.0, 63.0, 41.0, 44.0, 30.0, 36.0, 41.0, 28.0, 28.0, 23.0, 30.0, 25.0, 18.0, 17.0, 16.0, 5.0, 13.0, 8.0, 6.0, 4.0, 1.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.2109375, -13.7247314453125, -13.238525390625, -12.7523193359375, -12.26611328125, -11.7799072265625, -11.293701171875, -10.8074951171875, -10.3212890625, -9.8350830078125, -9.348876953125, -8.8626708984375, -8.37646484375, -7.8902587890625, -7.404052734375, -6.9178466796875, -6.431640625, -5.9454345703125, -5.459228515625, -4.9730224609375, -4.48681640625, -4.0006103515625, -3.514404296875, -3.0281982421875, -2.5419921875, -2.0557861328125, -1.569580078125, -1.0833740234375, -0.59716796875, -0.1109619140625, 0.375244140625, 0.8614501953125, 1.34765625, 1.8338623046875, 2.320068359375, 2.8062744140625, 3.29248046875, 3.7786865234375, 4.264892578125, 4.7510986328125, 5.2373046875, 5.7235107421875, 6.209716796875, 6.6959228515625, 7.18212890625, 7.6683349609375, 8.154541015625, 8.6407470703125, 9.126953125, 9.6131591796875, 10.099365234375, 10.5855712890625, 11.07177734375, 11.5579833984375, 12.044189453125, 12.5303955078125, 13.0166015625, 13.5028076171875, 13.989013671875, 14.4752197265625, 14.96142578125, 15.4476318359375, 15.933837890625, 16.4200439453125, 16.90625]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 3.0, 4.0, 7.0, 12.0, 6.0, 9.0, 12.0, 25.0, 20.0, 23.0, 34.0, 31.0, 41.0, 58.0, 84.0, 104.0, 175.0, 280.0, 526.0, 1590.0, 19052.0, 3070136.0, 49741.0, 2194.0, 619.0, 299.0, 160.0, 124.0, 77.0, 55.0, 42.0, 28.0, 27.0, 16.0, 12.0, 12.0, 10.0, 13.0, 7.0, 14.0, 4.0, 5.0, 3.0, 4.0, 3.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-28.421875, -27.600341796875, -26.77880859375, -25.957275390625, -25.1357421875, -24.314208984375, -23.49267578125, -22.671142578125, -21.849609375, -21.028076171875, -20.20654296875, -19.385009765625, -18.5634765625, -17.741943359375, -16.92041015625, -16.098876953125, -15.27734375, -14.455810546875, -13.63427734375, -12.812744140625, -11.9912109375, -11.169677734375, -10.34814453125, -9.526611328125, -8.705078125, -7.883544921875, -7.06201171875, -6.240478515625, -5.4189453125, -4.597412109375, -3.77587890625, -2.954345703125, -2.1328125, -1.311279296875, -0.48974609375, 0.331787109375, 1.1533203125, 1.974853515625, 2.79638671875, 3.617919921875, 4.439453125, 5.260986328125, 6.08251953125, 6.904052734375, 7.7255859375, 8.547119140625, 9.36865234375, 10.190185546875, 11.01171875, 11.833251953125, 12.65478515625, 13.476318359375, 14.2978515625, 15.119384765625, 15.94091796875, 16.762451171875, 17.583984375, 18.405517578125, 19.22705078125, 20.048583984375, 20.8701171875, 21.691650390625, 22.51318359375, 23.334716796875, 24.15625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 708.0, 306.0], "bins": [-385.0814208984375, -378.9547119140625, -372.8280029296875, -366.7013244628906, -360.5746154785156, -354.4479064941406, -348.3211975097656, -342.1944885253906, -336.06781005859375, -329.94110107421875, -323.81439208984375, -317.6877136230469, -311.5610046386719, -305.4342956542969, -299.3075866699219, -293.1808776855469, -287.0541687011719, -280.9274597167969, -274.8007507324219, -268.674072265625, -262.54736328125, -256.420654296875, -250.2939453125, -244.167236328125, -238.04054260253906, -231.91383361816406, -225.78713989257812, -219.66043090820312, -213.53372192382812, -207.4070281982422, -201.2803192138672, -195.15362548828125, -189.0269317626953, -182.9002227783203, -176.77352905273438, -170.64682006835938, -164.52011108398438, -158.39341735839844, -152.26670837402344, -146.1400146484375, -140.0133056640625, -133.8865966796875, -127.75990295410156, -121.63319396972656, -115.5064926147461, -109.37979125976562, -103.25308227539062, -97.12638092041016, -90.99967956542969, -84.87297821044922, -78.74627685546875, -72.61956787109375, -66.49286651611328, -60.36616516113281, -54.23945999145508, -48.112754821777344, -41.986053466796875, -35.859352111816406, -29.732646942138672, -23.60594367980957, -17.47924041748047, -11.352537155151367, -5.225833892822266, 0.9008712768554688, 7.027574062347412]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 3.0, 4.0, 10.0, 13.0, 19.0, 16.0, 20.0, 21.0, 13.0, 24.0, 30.0, 32.0, 40.0, 37.0, 40.0, 32.0, 49.0, 47.0, 58.0, 33.0, 46.0, 49.0, 37.0, 42.0, 33.0, 37.0, 31.0, 25.0, 19.0, 26.0, 17.0, 14.0, 17.0, 17.0, 9.0, 7.0, 8.0, 8.0, 7.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.77760314941406, -48.086917877197266, -46.3962287902832, -44.705543518066406, -43.014854431152344, -41.32416915893555, -39.63348388671875, -37.94279479980469, -36.25210952758789, -34.561424255371094, -32.87073516845703, -31.180049896240234, -29.489362716674805, -27.798675537109375, -26.107990264892578, -24.41730308532715, -22.72661590576172, -21.03592872619629, -19.34524154663086, -17.654556274414062, -15.963869094848633, -14.273181915283203, -12.58249568939209, -10.891809463500977, -9.201122283935547, -7.510435581207275, -5.819748878479004, -4.129062175750732, -2.438375473022461, -0.7476882934570312, 0.942997932434082, 2.6336841583251953, 4.324371337890625, 6.0150580406188965, 7.705744743347168, 9.396430969238281, 11.087118148803711, 12.77780532836914, 14.468491554260254, 16.159177780151367, 17.849864959716797, 19.540552139282227, 21.231239318847656, 22.921924591064453, 24.612611770629883, 26.303298950195312, 27.99398422241211, 29.68467140197754, 31.37535858154297, 33.066043853759766, 34.75673294067383, 36.447418212890625, 38.13810729980469, 39.828792572021484, 41.51947784423828, 43.210166931152344, 44.90085220336914, 46.59153747558594, 48.2822265625, 49.9729118347168, 51.663597106933594, 53.354286193847656, 55.04497146606445, 56.73565673828125, 58.42634582519531]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 4.0, 4.0, 1.0, 5.0, 9.0, 8.0, 5.0, 10.0, 13.0, 13.0, 12.0, 17.0, 13.0, 19.0, 21.0, 29.0, 33.0, 26.0, 29.0, 31.0, 34.0, 34.0, 30.0, 50.0, 31.0, 31.0, 34.0, 37.0, 39.0, 35.0, 27.0, 37.0, 35.0, 20.0, 18.0, 30.0, 22.0, 23.0, 22.0, 18.0, 19.0, 15.0, 17.0, 7.0, 5.0, 10.0, 9.0, 6.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.125, -3.99493408203125, -3.8648681640625, -3.73480224609375, -3.604736328125, -3.47467041015625, -3.3446044921875, -3.21453857421875, -3.08447265625, -2.95440673828125, -2.8243408203125, -2.69427490234375, -2.564208984375, -2.43414306640625, -2.3040771484375, -2.17401123046875, -2.0439453125, -1.91387939453125, -1.7838134765625, -1.65374755859375, -1.523681640625, -1.39361572265625, -1.2635498046875, -1.13348388671875, -1.00341796875, -0.87335205078125, -0.7432861328125, -0.61322021484375, -0.483154296875, -0.35308837890625, -0.2230224609375, -0.09295654296875, 0.037109375, 0.16717529296875, 0.2972412109375, 0.42730712890625, 0.557373046875, 0.68743896484375, 0.8175048828125, 0.94757080078125, 1.07763671875, 1.20770263671875, 1.3377685546875, 1.46783447265625, 1.597900390625, 1.72796630859375, 1.8580322265625, 1.98809814453125, 2.1181640625, 2.24822998046875, 2.3782958984375, 2.50836181640625, 2.638427734375, 2.76849365234375, 2.8985595703125, 3.02862548828125, 3.15869140625, 3.28875732421875, 3.4188232421875, 3.54888916015625, 3.678955078125, 3.80902099609375, 3.9390869140625, 4.06915283203125, 4.19921875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 5.0, 8.0, 3.0, 7.0, 16.0, 13.0, 12.0, 20.0, 20.0, 24.0, 30.0, 47.0, 39.0, 75.0, 118.0, 182.0, 432.0, 1630.0, 12712.0, 189137.0, 2873631.0, 1066454.0, 43623.0, 4409.0, 850.0, 274.0, 133.0, 85.0, 58.0, 44.0, 33.0, 31.0, 28.0, 22.0, 20.0, 13.0, 8.0, 6.0, 10.0, 6.0, 5.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.046875, -14.5576171875, -14.068359375, -13.5791015625, -13.08984375, -12.6005859375, -12.111328125, -11.6220703125, -11.1328125, -10.6435546875, -10.154296875, -9.6650390625, -9.17578125, -8.6865234375, -8.197265625, -7.7080078125, -7.21875, -6.7294921875, -6.240234375, -5.7509765625, -5.26171875, -4.7724609375, -4.283203125, -3.7939453125, -3.3046875, -2.8154296875, -2.326171875, -1.8369140625, -1.34765625, -0.8583984375, -0.369140625, 0.1201171875, 0.609375, 1.0986328125, 1.587890625, 2.0771484375, 2.56640625, 3.0556640625, 3.544921875, 4.0341796875, 4.5234375, 5.0126953125, 5.501953125, 5.9912109375, 6.48046875, 6.9697265625, 7.458984375, 7.9482421875, 8.4375, 8.9267578125, 9.416015625, 9.9052734375, 10.39453125, 10.8837890625, 11.373046875, 11.8623046875, 12.3515625, 12.8408203125, 13.330078125, 13.8193359375, 14.30859375, 14.7978515625, 15.287109375, 15.7763671875, 16.265625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 6.0, 6.0, 13.0, 13.0, 17.0, 27.0, 31.0, 42.0, 56.0, 66.0, 87.0, 111.0, 135.0, 204.0, 218.0, 265.0, 327.0, 368.0, 368.0, 350.0, 277.0, 254.0, 211.0, 136.0, 115.0, 87.0, 74.0, 46.0, 41.0, 32.0, 25.0, 21.0, 7.0, 9.0, 12.0, 6.0, 2.0, 2.0, 3.0, 0.0, 0.0, 5.0, 0.0, 1.0], "bins": [-13.203125, -12.855712890625, -12.50830078125, -12.160888671875, -11.8134765625, -11.466064453125, -11.11865234375, -10.771240234375, -10.423828125, -10.076416015625, -9.72900390625, -9.381591796875, -9.0341796875, -8.686767578125, -8.33935546875, -7.991943359375, -7.64453125, -7.297119140625, -6.94970703125, -6.602294921875, -6.2548828125, -5.907470703125, -5.56005859375, -5.212646484375, -4.865234375, -4.517822265625, -4.17041015625, -3.822998046875, -3.4755859375, -3.128173828125, -2.78076171875, -2.433349609375, -2.0859375, -1.738525390625, -1.39111328125, -1.043701171875, -0.6962890625, -0.348876953125, -0.00146484375, 0.345947265625, 0.693359375, 1.040771484375, 1.38818359375, 1.735595703125, 2.0830078125, 2.430419921875, 2.77783203125, 3.125244140625, 3.47265625, 3.820068359375, 4.16748046875, 4.514892578125, 4.8623046875, 5.209716796875, 5.55712890625, 5.904541015625, 6.251953125, 6.599365234375, 6.94677734375, 7.294189453125, 7.6416015625, 7.989013671875, 8.33642578125, 8.683837890625, 9.03125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 5.0, 6.0, 17.0, 11.0, 16.0, 33.0, 36.0, 51.0, 76.0, 115.0, 167.0, 244.0, 470.0, 1292.0, 42964.0, 4059306.0, 86565.0, 1638.0, 453.0, 253.0, 170.0, 115.0, 87.0, 48.0, 39.0, 31.0, 22.0, 17.0, 14.0, 9.0, 4.0, 2.0, 4.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.96875, -41.21923828125, -39.4697265625, -37.72021484375, -35.970703125, -34.22119140625, -32.4716796875, -30.72216796875, -28.97265625, -27.22314453125, -25.4736328125, -23.72412109375, -21.974609375, -20.22509765625, -18.4755859375, -16.72607421875, -14.9765625, -13.22705078125, -11.4775390625, -9.72802734375, -7.978515625, -6.22900390625, -4.4794921875, -2.72998046875, -0.98046875, 0.76904296875, 2.5185546875, 4.26806640625, 6.017578125, 7.76708984375, 9.5166015625, 11.26611328125, 13.015625, 14.76513671875, 16.5146484375, 18.26416015625, 20.013671875, 21.76318359375, 23.5126953125, 25.26220703125, 27.01171875, 28.76123046875, 30.5107421875, 32.26025390625, 34.009765625, 35.75927734375, 37.5087890625, 39.25830078125, 41.0078125, 42.75732421875, 44.5068359375, 46.25634765625, 48.005859375, 49.75537109375, 51.5048828125, 53.25439453125, 55.00390625, 56.75341796875, 58.5029296875, 60.25244140625, 62.001953125, 63.75146484375, 65.5009765625, 67.25048828125, 69.0]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 7.0, 28.0, 59.0, 93.0, 138.0, 187.0, 184.0, 149.0, 85.0, 46.0, 22.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-129.93470764160156, -127.47964477539062, -125.02458190917969, -122.56951141357422, -120.11444854736328, -117.65938568115234, -115.2043228149414, -112.74925231933594, -110.294189453125, -107.83912658691406, -105.38406372070312, -102.92899322509766, -100.47393035888672, -98.01886749267578, -95.56380462646484, -93.10873413085938, -90.65367126464844, -88.1986083984375, -85.74354553222656, -83.2884750366211, -80.83341217041016, -78.37834930419922, -75.92328643798828, -73.46821594238281, -71.0131607055664, -68.55809783935547, -66.10303497314453, -63.64796829223633, -61.192901611328125, -58.73783874511719, -56.28277587890625, -53.82770919799805, -51.372642517089844, -48.917579650878906, -46.4625129699707, -44.007450103759766, -41.55238342285156, -39.097320556640625, -36.64225769042969, -34.187191009521484, -31.732126235961914, -29.277061462402344, -26.821996688842773, -24.366931915283203, -21.911869049072266, -19.456802368164062, -17.001739501953125, -14.546674728393555, -12.091609954833984, -9.636545181274414, -7.181480884552002, -4.72641658782959, -2.2713518142700195, 0.18371295928955078, 2.6387767791748047, 5.093841552734375, 7.548906326293945, 10.003971099853516, 12.459035873413086, 14.91409969329834, 17.369163513183594, 19.824230194091797, 22.279293060302734, 24.734357833862305, 27.189422607421875]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 5.0, 7.0, 4.0, 3.0, 4.0, 7.0, 12.0, 17.0, 11.0, 15.0, 10.0, 8.0, 18.0, 26.0, 24.0, 28.0, 39.0, 26.0, 34.0, 30.0, 43.0, 45.0, 31.0, 44.0, 34.0, 39.0, 48.0, 32.0, 34.0, 32.0, 40.0, 42.0, 32.0, 31.0, 30.0, 18.0, 19.0, 12.0, 13.0, 11.0, 10.0, 9.0, 9.0, 4.0, 5.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.14979553222656, -35.78934097290039, -34.42888641357422, -33.06843185424805, -31.707977294921875, -30.347522735595703, -28.987070083618164, -27.626615524291992, -26.26616096496582, -24.90570640563965, -23.545251846313477, -22.184799194335938, -20.824344635009766, -19.463890075683594, -18.103435516357422, -16.74298095703125, -15.382526397705078, -14.022071838378906, -12.661617279052734, -11.301163673400879, -9.940709114074707, -8.580254554748535, -7.21980094909668, -5.859346389770508, -4.498891830444336, -3.138437509536743, -1.7779831886291504, -0.4175291061401367, 0.9429254531860352, 2.303380012512207, 3.6638336181640625, 5.024288177490234, 6.384742736816406, 7.745197296142578, 9.10565185546875, 10.466105461120605, 11.826560020446777, 13.18701457977295, 14.547468185424805, 15.907922744750977, 17.26837730407715, 18.62883186340332, 19.989286422729492, 21.34973907470703, 22.710193634033203, 24.070648193359375, 25.431102752685547, 26.79155731201172, 28.15201187133789, 29.512466430664062, 30.872920989990234, 32.233375549316406, 33.59383010864258, 34.95428466796875, 36.314735412597656, 37.675193786621094, 39.03564453125, 40.39609909057617, 41.756553649902344, 43.117008209228516, 44.47746276855469, 45.83791732788086, 47.19837188720703, 48.55882263183594, 49.919281005859375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 7.0, 6.0, 4.0, 12.0, 12.0, 11.0, 12.0, 14.0, 13.0, 13.0, 23.0, 19.0, 27.0, 23.0, 39.0, 39.0, 42.0, 27.0, 38.0, 27.0, 38.0, 46.0, 35.0, 38.0, 39.0, 39.0, 29.0, 33.0, 42.0, 23.0, 30.0, 25.0, 26.0, 27.0, 20.0, 17.0, 23.0, 9.0, 12.0, 11.0, 10.0, 7.0, 5.0, 2.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.93359375, -4.7896728515625, -4.645751953125, -4.5018310546875, -4.35791015625, -4.2139892578125, -4.070068359375, -3.9261474609375, -3.7822265625, -3.6383056640625, -3.494384765625, -3.3504638671875, -3.20654296875, -3.0626220703125, -2.918701171875, -2.7747802734375, -2.630859375, -2.4869384765625, -2.343017578125, -2.1990966796875, -2.05517578125, -1.9112548828125, -1.767333984375, -1.6234130859375, -1.4794921875, -1.3355712890625, -1.191650390625, -1.0477294921875, -0.90380859375, -0.7598876953125, -0.615966796875, -0.4720458984375, -0.328125, -0.1842041015625, -0.040283203125, 0.1036376953125, 0.24755859375, 0.3914794921875, 0.535400390625, 0.6793212890625, 0.8232421875, 0.9671630859375, 1.111083984375, 1.2550048828125, 1.39892578125, 1.5428466796875, 1.686767578125, 1.8306884765625, 1.974609375, 2.1185302734375, 2.262451171875, 2.4063720703125, 2.55029296875, 2.6942138671875, 2.838134765625, 2.9820556640625, 3.1259765625, 3.2698974609375, 3.413818359375, 3.5577392578125, 3.70166015625, 3.8455810546875, 3.989501953125, 4.1334228515625, 4.27734375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 11.0, 17.0, 25.0, 28.0, 47.0, 67.0, 109.0, 175.0, 236.0, 329.0, 567.0, 766.0, 1065.0, 1675.0, 2396.0, 3459.0, 5109.0, 7425.0, 11058.0, 16105.0, 24936.0, 38396.0, 60764.0, 101236.0, 200345.0, 251228.0, 121109.0, 70671.0, 43856.0, 27917.0, 18502.0, 12304.0, 8486.0, 5757.0, 3951.0, 2609.0, 1851.0, 1316.0, 864.0, 587.0, 400.0, 279.0, 184.0, 100.0, 83.0, 65.0, 33.0, 23.0, 13.0, 9.0, 4.0, 3.0, 8.0, 1.0, 3.0], "bins": [-0.93798828125, -0.9105224609375, -0.883056640625, -0.8555908203125, -0.828125, -0.8006591796875, -0.773193359375, -0.7457275390625, -0.71826171875, -0.6907958984375, -0.663330078125, -0.6358642578125, -0.6083984375, -0.5809326171875, -0.553466796875, -0.5260009765625, -0.49853515625, -0.4710693359375, -0.443603515625, -0.4161376953125, -0.388671875, -0.3612060546875, -0.333740234375, -0.3062744140625, -0.27880859375, -0.2513427734375, -0.223876953125, -0.1964111328125, -0.1689453125, -0.1414794921875, -0.114013671875, -0.0865478515625, -0.05908203125, -0.0316162109375, -0.004150390625, 0.0233154296875, 0.05078125, 0.0782470703125, 0.105712890625, 0.1331787109375, 0.16064453125, 0.1881103515625, 0.215576171875, 0.2430419921875, 0.2705078125, 0.2979736328125, 0.325439453125, 0.3529052734375, 0.38037109375, 0.4078369140625, 0.435302734375, 0.4627685546875, 0.490234375, 0.5177001953125, 0.545166015625, 0.5726318359375, 0.60009765625, 0.6275634765625, 0.655029296875, 0.6824951171875, 0.7099609375, 0.7374267578125, 0.764892578125, 0.7923583984375, 0.81982421875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 4.0, 11.0, 9.0, 10.0, 14.0, 19.0, 16.0, 13.0, 18.0, 26.0, 28.0, 31.0, 33.0, 30.0, 35.0, 29.0, 40.0, 45.0, 43.0, 30.0, 1064.0, 32.0, 41.0, 47.0, 34.0, 26.0, 30.0, 41.0, 27.0, 30.0, 27.0, 17.0, 14.0, 18.0, 12.0, 10.0, 14.0, 7.0, 8.0, 7.0, 4.0, 1.0, 5.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 4.0], "bins": [-2.9921875, -2.90423583984375, -2.8162841796875, -2.72833251953125, -2.640380859375, -2.55242919921875, -2.4644775390625, -2.37652587890625, -2.28857421875, -2.20062255859375, -2.1126708984375, -2.02471923828125, -1.936767578125, -1.84881591796875, -1.7608642578125, -1.67291259765625, -1.5849609375, -1.49700927734375, -1.4090576171875, -1.32110595703125, -1.233154296875, -1.14520263671875, -1.0572509765625, -0.96929931640625, -0.88134765625, -0.79339599609375, -0.7054443359375, -0.61749267578125, -0.529541015625, -0.44158935546875, -0.3536376953125, -0.26568603515625, -0.177734375, -0.08978271484375, -0.0018310546875, 0.08612060546875, 0.174072265625, 0.26202392578125, 0.3499755859375, 0.43792724609375, 0.52587890625, 0.61383056640625, 0.7017822265625, 0.78973388671875, 0.877685546875, 0.96563720703125, 1.0535888671875, 1.14154052734375, 1.2294921875, 1.31744384765625, 1.4053955078125, 1.49334716796875, 1.581298828125, 1.66925048828125, 1.7572021484375, 1.84515380859375, 1.93310546875, 2.02105712890625, 2.1090087890625, 2.19696044921875, 2.284912109375, 2.37286376953125, 2.4608154296875, 2.54876708984375, 2.63671875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 2.0, 0.0, 3.0, 3.0, 7.0, 8.0, 1.0, 2.0, 8.0, 7.0, 6.0, 15.0, 23.0, 24.0, 51.0, 95.0, 150.0, 256.0, 491.0, 766.0, 1459.0, 2461.0, 4487.0, 8151.0, 15267.0, 29900.0, 59843.0, 137641.0, 1465930.0, 209418.0, 79732.0, 38331.0, 19431.0, 10337.0, 5597.0, 3099.0, 1713.0, 998.0, 565.0, 354.0, 203.0, 110.0, 63.0, 49.0, 27.0, 10.0, 18.0, 9.0, 5.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.271484375, -1.2286529541015625, -1.185821533203125, -1.1429901123046875, -1.10015869140625, -1.0573272705078125, -1.014495849609375, -0.9716644287109375, -0.9288330078125, -0.8860015869140625, -0.843170166015625, -0.8003387451171875, -0.75750732421875, -0.7146759033203125, -0.671844482421875, -0.6290130615234375, -0.586181640625, -0.5433502197265625, -0.500518798828125, -0.4576873779296875, -0.41485595703125, -0.3720245361328125, -0.329193115234375, -0.2863616943359375, -0.2435302734375, -0.2006988525390625, -0.157867431640625, -0.1150360107421875, -0.07220458984375, -0.0293731689453125, 0.013458251953125, 0.0562896728515625, 0.09912109375, 0.1419525146484375, 0.184783935546875, 0.2276153564453125, 0.27044677734375, 0.3132781982421875, 0.356109619140625, 0.3989410400390625, 0.4417724609375, 0.4846038818359375, 0.527435302734375, 0.5702667236328125, 0.61309814453125, 0.6559295654296875, 0.698760986328125, 0.7415924072265625, 0.784423828125, 0.8272552490234375, 0.870086669921875, 0.9129180908203125, 0.95574951171875, 0.9985809326171875, 1.041412353515625, 1.0842437744140625, 1.1270751953125, 1.1699066162109375, 1.212738037109375, 1.2555694580078125, 1.29840087890625, 1.3412322998046875, 1.384063720703125, 1.4268951416015625, 1.4697265625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 5.0, 1.0, 9.0, 11.0, 15.0, 16.0, 23.0, 32.0, 33.0, 51.0, 55.0, 99.0, 81.0, 95.0, 88.0, 94.0, 70.0, 58.0, 37.0, 28.0, 33.0, 16.0, 12.0, 9.0, 9.0, 5.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007257461547851562, -0.0006987899541854858, -0.0006718337535858154, -0.000644877552986145, -0.0006179213523864746, -0.0005909651517868042, -0.0005640089511871338, -0.0005370527505874634, -0.000510096549987793, -0.00048314034938812256, -0.00045618414878845215, -0.00042922794818878174, -0.00040227174758911133, -0.0003753155469894409, -0.0003483593463897705, -0.0003214031457901001, -0.0002944469451904297, -0.0002674907445907593, -0.00024053454399108887, -0.00021357834339141846, -0.00018662214279174805, -0.00015966594219207764, -0.00013270974159240723, -0.00010575354099273682, -7.87973403930664e-05, -5.1841139793395996e-05, -2.4884939193725586e-05, 2.0712614059448242e-06, 2.9027462005615234e-05, 5.5983662605285645e-05, 8.293986320495605e-05, 0.00010989606380462646, 0.00013685226440429688, 0.00016380846500396729, 0.0001907646656036377, 0.0002177208662033081, 0.0002446770668029785, 0.0002716332674026489, 0.00029858946800231934, 0.00032554566860198975, 0.00035250186920166016, 0.00037945806980133057, 0.000406414270401001, 0.0004333704710006714, 0.0004603266716003418, 0.0004872828722000122, 0.0005142390727996826, 0.000541195273399353, 0.0005681514739990234, 0.0005951076745986938, 0.0006220638751983643, 0.0006490200757980347, 0.0006759762763977051, 0.0007029324769973755, 0.0007298886775970459, 0.0007568448781967163, 0.0007838010787963867, 0.0008107572793960571, 0.0008377134799957275, 0.000864669680595398, 0.0008916258811950684, 0.0009185820817947388, 0.0009455382823944092, 0.0009724944829940796, 0.00099945068359375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 5.0, 8.0, 15.0, 10.0, 20.0, 48.0, 72.0, 121.0, 223.0, 405.0, 1298.0, 1007882.0, 37031.0, 670.0, 306.0, 163.0, 98.0, 47.0, 44.0, 19.0, 19.0, 16.0, 9.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.02313232421875, -0.022503376007080078, -0.021874427795410156, -0.021245479583740234, -0.020616531372070312, -0.01998758316040039, -0.01935863494873047, -0.018729686737060547, -0.018100738525390625, -0.017471790313720703, -0.01684284210205078, -0.01621389389038086, -0.015584945678710938, -0.014955997467041016, -0.014327049255371094, -0.013698101043701172, -0.01306915283203125, -0.012440204620361328, -0.011811256408691406, -0.011182308197021484, -0.010553359985351562, -0.00992441177368164, -0.009295463562011719, -0.008666515350341797, -0.008037567138671875, -0.007408618927001953, -0.006779670715332031, -0.006150722503662109, -0.0055217742919921875, -0.004892826080322266, -0.004263877868652344, -0.003634929656982422, -0.0030059814453125, -0.002377033233642578, -0.0017480850219726562, -0.0011191368103027344, -0.0004901885986328125, 0.00013875961303710938, 0.0007677078247070312, 0.0013966560363769531, 0.002025604248046875, 0.002654552459716797, 0.0032835006713867188, 0.003912448883056641, 0.0045413970947265625, 0.005170345306396484, 0.005799293518066406, 0.006428241729736328, 0.00705718994140625, 0.007686138153076172, 0.008315086364746094, 0.008944034576416016, 0.009572982788085938, 0.01020193099975586, 0.010830879211425781, 0.011459827423095703, 0.012088775634765625, 0.012717723846435547, 0.013346672058105469, 0.01397562026977539, 0.014604568481445312, 0.015233516693115234, 0.015862464904785156, 0.016491413116455078, 0.017120361328125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 23.0, 124.0, 356.0, 394.0, 109.0, 10.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019988541025668383, -0.0019475888693705201, -0.001896323636174202, -0.001845058286562562, -0.0017937930533662438, -0.0017425278201699257, -0.0016912625869736075, -0.0016399973537772894, -0.0015887320041656494, -0.0015374667709693313, -0.0014862015377730131, -0.0014349361881613731, -0.001383670954965055, -0.0013324057217687368, -0.0012811404885724187, -0.0012298752553761005, -0.0011786099057644606, -0.0011273446725681424, -0.0010760794393718243, -0.0010248140897601843, -0.0009735488565638661, -0.000922283623367548, -0.0008710183901712298, -0.0008197530987672508, -0.0007684879237785935, -0.0007172226905822754, -0.0006659573991782963, -0.0006146921659819782, -0.0005634268745779991, -0.000512161641381681, -0.00046089637908153236, -0.00040963111678138375, -0.0003583658253774047, -0.0003071005630772561, -0.0002558353007771075, -0.0002045700530288741, -0.0001533047907287255, -0.00010203954298049212, -5.077428068034351e-05, 4.909816198050976e-07, 5.1756243919953704e-05, 0.00010302150622010231, 0.00015428676852025092, 0.0002055520162684843, 0.00025681726401671767, 0.0003080825263168663, 0.0003593477886170149, 0.0004106130509171635, 0.0004618783132173121, 0.0005131435464136302, 0.0005644088378176093, 0.0006156740710139275, 0.0006669393624179065, 0.0007182045956142247, 0.0007694698870182037, 0.0008207351202145219, 0.00087200035341084, 0.0009232655866071582, 0.0009745308780111372, 0.0010257961694151163, 0.0010770614026114345, 0.0011283266358077526, 0.0011795918690040708, 0.001230857102200389, 0.0012821224518120289]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 5.0, 3.0, 5.0, 3.0, 13.0, 10.0, 7.0, 14.0, 16.0, 10.0, 19.0, 15.0, 18.0, 25.0, 33.0, 37.0, 39.0, 26.0, 32.0, 33.0, 47.0, 47.0, 42.0, 31.0, 35.0, 35.0, 48.0, 34.0, 39.0, 41.0, 21.0, 33.0, 28.0, 31.0, 19.0, 25.0, 15.0, 13.0, 15.0, 10.0, 8.0, 8.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00031310319900512695, -0.0003028968349099159, -0.0002926904708147049, -0.00028248410671949387, -0.00027227774262428284, -0.0002620713785290718, -0.0002518650144338608, -0.00024165865033864975, -0.00023145228624343872, -0.0002212459221482277, -0.00021103955805301666, -0.00020083319395780563, -0.0001906268298625946, -0.00018042046576738358, -0.00017021410167217255, -0.00016000773757696152, -0.0001498013734817505, -0.00013959500938653946, -0.00012938864529132843, -0.0001191822811961174, -0.00010897591710090637, -9.876955300569534e-05, -8.856318891048431e-05, -7.835682481527328e-05, -6.815046072006226e-05, -5.794409662485123e-05, -4.77377325296402e-05, -3.753136843442917e-05, -2.732500433921814e-05, -1.711864024400711e-05, -6.9122761487960815e-06, 3.2940879464149475e-06, 1.3500452041625977e-05, 2.3706816136837006e-05, 3.3913180232048035e-05, 4.4119544327259064e-05, 5.432590842247009e-05, 6.453227251768112e-05, 7.473863661289215e-05, 8.494500070810318e-05, 9.515136480331421e-05, 0.00010535772889852524, 0.00011556409299373627, 0.0001257704570889473, 0.00013597682118415833, 0.00014618318527936935, 0.00015638954937458038, 0.0001665959134697914, 0.00017680227756500244, 0.00018700864166021347, 0.0001972150057554245, 0.00020742136985063553, 0.00021762773394584656, 0.0002278340980410576, 0.00023804046213626862, 0.00024824682623147964, 0.0002584531903266907, 0.0002686595544219017, 0.00027886591851711273, 0.00028907228261232376, 0.0002992786467075348, 0.0003094850108027458, 0.00031969137489795685, 0.0003298977389931679, 0.0003401041030883789]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 7.0, 6.0, 4.0, 12.0, 12.0, 11.0, 12.0, 14.0, 13.0, 13.0, 23.0, 19.0, 27.0, 23.0, 39.0, 39.0, 42.0, 27.0, 38.0, 27.0, 38.0, 46.0, 35.0, 38.0, 39.0, 39.0, 29.0, 33.0, 42.0, 23.0, 30.0, 25.0, 26.0, 27.0, 20.0, 17.0, 23.0, 9.0, 12.0, 11.0, 10.0, 7.0, 5.0, 2.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.93359375, -4.7896728515625, -4.645751953125, -4.5018310546875, -4.35791015625, -4.2139892578125, -4.070068359375, -3.9261474609375, -3.7822265625, -3.6383056640625, -3.494384765625, -3.3504638671875, -3.20654296875, -3.0626220703125, -2.918701171875, -2.7747802734375, -2.630859375, -2.4869384765625, -2.343017578125, -2.1990966796875, -2.05517578125, -1.9112548828125, -1.767333984375, -1.6234130859375, -1.4794921875, -1.3355712890625, -1.191650390625, -1.0477294921875, -0.90380859375, -0.7598876953125, -0.615966796875, -0.4720458984375, -0.328125, -0.1842041015625, -0.040283203125, 0.1036376953125, 0.24755859375, 0.3914794921875, 0.535400390625, 0.6793212890625, 0.8232421875, 0.9671630859375, 1.111083984375, 1.2550048828125, 1.39892578125, 1.5428466796875, 1.686767578125, 1.8306884765625, 1.974609375, 2.1185302734375, 2.262451171875, 2.4063720703125, 2.55029296875, 2.6942138671875, 2.838134765625, 2.9820556640625, 3.1259765625, 3.2698974609375, 3.413818359375, 3.5577392578125, 3.70166015625, 3.8455810546875, 3.989501953125, 4.1334228515625, 4.27734375]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 3.0, 7.0, 5.0, 12.0, 28.0, 33.0, 51.0, 91.0, 159.0, 229.0, 339.0, 532.0, 850.0, 1295.0, 2087.0, 3306.0, 5583.0, 10222.0, 19988.0, 46529.0, 144029.0, 467985.0, 224953.0, 64790.0, 25469.0, 12669.0, 6895.0, 3842.0, 2375.0, 1512.0, 966.0, 599.0, 410.0, 255.0, 152.0, 113.0, 82.0, 40.0, 32.0, 16.0, 5.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.92578125, -3.788818359375, -3.65185546875, -3.514892578125, -3.3779296875, -3.240966796875, -3.10400390625, -2.967041015625, -2.830078125, -2.693115234375, -2.55615234375, -2.419189453125, -2.2822265625, -2.145263671875, -2.00830078125, -1.871337890625, -1.734375, -1.597412109375, -1.46044921875, -1.323486328125, -1.1865234375, -1.049560546875, -0.91259765625, -0.775634765625, -0.638671875, -0.501708984375, -0.36474609375, -0.227783203125, -0.0908203125, 0.046142578125, 0.18310546875, 0.320068359375, 0.45703125, 0.593994140625, 0.73095703125, 0.867919921875, 1.0048828125, 1.141845703125, 1.27880859375, 1.415771484375, 1.552734375, 1.689697265625, 1.82666015625, 1.963623046875, 2.1005859375, 2.237548828125, 2.37451171875, 2.511474609375, 2.6484375, 2.785400390625, 2.92236328125, 3.059326171875, 3.1962890625, 3.333251953125, 3.47021484375, 3.607177734375, 3.744140625, 3.881103515625, 4.01806640625, 4.155029296875, 4.2919921875, 4.428955078125, 4.56591796875, 4.702880859375, 4.83984375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 8.0, 10.0, 8.0, 9.0, 9.0, 12.0, 13.0, 16.0, 8.0, 15.0, 21.0, 31.0, 41.0, 37.0, 30.0, 47.0, 58.0, 50.0, 84.0, 461.0, 1517.0, 102.0, 53.0, 55.0, 51.0, 38.0, 28.0, 32.0, 32.0, 20.0, 27.0, 13.0, 24.0, 19.0, 10.0, 13.0, 6.0, 7.0, 7.0, 3.0, 6.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-15.7109375, -15.220703125, -14.73046875, -14.240234375, -13.75, -13.259765625, -12.76953125, -12.279296875, -11.7890625, -11.298828125, -10.80859375, -10.318359375, -9.828125, -9.337890625, -8.84765625, -8.357421875, -7.8671875, -7.376953125, -6.88671875, -6.396484375, -5.90625, -5.416015625, -4.92578125, -4.435546875, -3.9453125, -3.455078125, -2.96484375, -2.474609375, -1.984375, -1.494140625, -1.00390625, -0.513671875, -0.0234375, 0.466796875, 0.95703125, 1.447265625, 1.9375, 2.427734375, 2.91796875, 3.408203125, 3.8984375, 4.388671875, 4.87890625, 5.369140625, 5.859375, 6.349609375, 6.83984375, 7.330078125, 7.8203125, 8.310546875, 8.80078125, 9.291015625, 9.78125, 10.271484375, 10.76171875, 11.251953125, 11.7421875, 12.232421875, 12.72265625, 13.212890625, 13.703125, 14.193359375, 14.68359375, 15.173828125, 15.6640625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 8.0, 1.0, 8.0, 5.0, 13.0, 10.0, 20.0, 19.0, 24.0, 36.0, 33.0, 55.0, 59.0, 71.0, 102.0, 172.0, 255.0, 448.0, 1409.0, 14945.0, 2881698.0, 239074.0, 5312.0, 794.0, 363.0, 181.0, 143.0, 118.0, 82.0, 45.0, 31.0, 26.0, 15.0, 20.0, 20.0, 22.0, 16.0, 11.0, 6.0, 9.0, 6.0, 2.0, 6.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-32.09375, -31.144775390625, -30.19580078125, -29.246826171875, -28.2978515625, -27.348876953125, -26.39990234375, -25.450927734375, -24.501953125, -23.552978515625, -22.60400390625, -21.655029296875, -20.7060546875, -19.757080078125, -18.80810546875, -17.859130859375, -16.91015625, -15.961181640625, -15.01220703125, -14.063232421875, -13.1142578125, -12.165283203125, -11.21630859375, -10.267333984375, -9.318359375, -8.369384765625, -7.42041015625, -6.471435546875, -5.5224609375, -4.573486328125, -3.62451171875, -2.675537109375, -1.7265625, -0.777587890625, 0.17138671875, 1.120361328125, 2.0693359375, 3.018310546875, 3.96728515625, 4.916259765625, 5.865234375, 6.814208984375, 7.76318359375, 8.712158203125, 9.6611328125, 10.610107421875, 11.55908203125, 12.508056640625, 13.45703125, 14.406005859375, 15.35498046875, 16.303955078125, 17.2529296875, 18.201904296875, 19.15087890625, 20.099853515625, 21.048828125, 21.997802734375, 22.94677734375, 23.895751953125, 24.8447265625, 25.793701171875, 26.74267578125, 27.691650390625, 28.640625]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 24.0, 194.0, 555.0, 216.0, 22.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-147.08242797851562, -144.2819061279297, -141.4813995361328, -138.68087768554688, -135.88035583496094, -133.07984924316406, -130.27932739257812, -127.47881317138672, -124.67829895019531, -121.8777847290039, -119.07726287841797, -116.27674865722656, -113.47623443603516, -110.67572021484375, -107.87519836425781, -105.0746841430664, -102.27416229248047, -99.47364807128906, -96.67312622070312, -93.87261199951172, -91.07209777832031, -88.27157592773438, -85.47106170654297, -82.67054748535156, -79.87002563476562, -77.06951141357422, -74.26898956298828, -71.46847534179688, -68.66796112060547, -65.86744689941406, -63.066925048828125, -60.26641082763672, -57.465904235839844, -54.66538619995117, -51.864871978759766, -49.064353942871094, -46.26383972167969, -43.463321685791016, -40.662803649902344, -37.86228942871094, -35.061771392822266, -32.261253356933594, -29.460739135742188, -26.660221099853516, -23.859704971313477, -21.059188842773438, -18.258670806884766, -15.458154678344727, -12.657638549804688, -9.857122421264648, -7.056605339050293, -4.2560882568359375, -1.4555721282958984, 1.3449440002441406, 4.1454620361328125, 6.945978164672852, 9.74649429321289, 12.54701042175293, 15.347527503967285, 18.14804458618164, 20.94856071472168, 23.74907684326172, 26.54959487915039, 29.35011100769043, 32.15062713623047]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 9.0, 9.0, 5.0, 11.0, 9.0, 11.0, 13.0, 16.0, 12.0, 19.0, 26.0, 28.0, 32.0, 19.0, 33.0, 23.0, 41.0, 52.0, 42.0, 36.0, 33.0, 49.0, 31.0, 37.0, 38.0, 35.0, 37.0, 36.0, 25.0, 24.0, 31.0, 25.0, 33.0, 22.0, 16.0, 18.0, 13.0, 11.0, 8.0, 7.0, 5.0, 8.0, 6.0, 4.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-46.02405548095703, -44.578773498535156, -43.13349533081055, -41.68821716308594, -40.24293518066406, -38.79765319824219, -37.35237503051758, -35.90709686279297, -34.461814880371094, -33.01653289794922, -31.57125473022461, -30.125974655151367, -28.680694580078125, -27.235414505004883, -25.79013442993164, -24.3448543548584, -22.899574279785156, -21.454294204711914, -20.009014129638672, -18.56373405456543, -17.118453979492188, -15.673173904418945, -14.227893829345703, -12.782613754272461, -11.337333679199219, -9.892053604125977, -8.446773529052734, -7.001493453979492, -5.55621337890625, -4.110933303833008, -2.6656532287597656, -1.2203731536865234, 0.22490692138671875, 1.670186996459961, 3.115467071533203, 4.560747146606445, 6.0060272216796875, 7.45130729675293, 8.896587371826172, 10.341867446899414, 11.787147521972656, 13.232427597045898, 14.67770767211914, 16.122987747192383, 17.568267822265625, 19.013547897338867, 20.45882797241211, 21.90410804748535, 23.349388122558594, 24.794668197631836, 26.239948272705078, 27.68522834777832, 29.130508422851562, 30.575788497924805, 32.02106857299805, 33.466346740722656, 34.91162872314453, 36.356910705566406, 37.802188873291016, 39.247467041015625, 40.6927490234375, 42.138031005859375, 43.583309173583984, 45.028587341308594, 46.47386932373047]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 2.0, 5.0, 3.0, 11.0, 13.0, 12.0, 13.0, 11.0, 14.0, 11.0, 17.0, 32.0, 24.0, 40.0, 27.0, 34.0, 32.0, 34.0, 38.0, 44.0, 39.0, 37.0, 35.0, 37.0, 40.0, 34.0, 26.0, 33.0, 41.0, 20.0, 28.0, 31.0, 30.0, 25.0, 22.0, 13.0, 15.0, 12.0, 21.0, 11.0, 8.0, 8.0, 7.0, 2.0, 4.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.98046875, -4.83099365234375, -4.6815185546875, -4.53204345703125, -4.382568359375, -4.23309326171875, -4.0836181640625, -3.93414306640625, -3.78466796875, -3.63519287109375, -3.4857177734375, -3.33624267578125, -3.186767578125, -3.03729248046875, -2.8878173828125, -2.73834228515625, -2.5888671875, -2.43939208984375, -2.2899169921875, -2.14044189453125, -1.990966796875, -1.84149169921875, -1.6920166015625, -1.54254150390625, -1.39306640625, -1.24359130859375, -1.0941162109375, -0.94464111328125, -0.795166015625, -0.64569091796875, -0.4962158203125, -0.34674072265625, -0.197265625, -0.04779052734375, 0.1016845703125, 0.25115966796875, 0.400634765625, 0.55010986328125, 0.6995849609375, 0.84906005859375, 0.99853515625, 1.14801025390625, 1.2974853515625, 1.44696044921875, 1.596435546875, 1.74591064453125, 1.8953857421875, 2.04486083984375, 2.1943359375, 2.34381103515625, 2.4932861328125, 2.64276123046875, 2.792236328125, 2.94171142578125, 3.0911865234375, 3.24066162109375, 3.39013671875, 3.53961181640625, 3.6890869140625, 3.83856201171875, 3.988037109375, 4.13751220703125, 4.2869873046875, 4.43646240234375, 4.5859375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 6.0, 3.0, 7.0, 8.0, 8.0, 17.0, 33.0, 39.0, 51.0, 85.0, 131.0, 217.0, 359.0, 751.0, 1518.0, 3963.0, 11771.0, 45125.0, 237263.0, 1098257.0, 1838240.0, 765941.0, 146035.0, 30089.0, 8633.0, 2968.0, 1265.0, 589.0, 322.0, 213.0, 128.0, 89.0, 51.0, 38.0, 21.0, 19.0, 9.0, 6.0, 5.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.5, -8.2662353515625, -8.032470703125, -7.7987060546875, -7.56494140625, -7.3311767578125, -7.097412109375, -6.8636474609375, -6.6298828125, -6.3961181640625, -6.162353515625, -5.9285888671875, -5.69482421875, -5.4610595703125, -5.227294921875, -4.9935302734375, -4.759765625, -4.5260009765625, -4.292236328125, -4.0584716796875, -3.82470703125, -3.5909423828125, -3.357177734375, -3.1234130859375, -2.8896484375, -2.6558837890625, -2.422119140625, -2.1883544921875, -1.95458984375, -1.7208251953125, -1.487060546875, -1.2532958984375, -1.01953125, -0.7857666015625, -0.552001953125, -0.3182373046875, -0.08447265625, 0.1492919921875, 0.383056640625, 0.6168212890625, 0.8505859375, 1.0843505859375, 1.318115234375, 1.5518798828125, 1.78564453125, 2.0194091796875, 2.253173828125, 2.4869384765625, 2.720703125, 2.9544677734375, 3.188232421875, 3.4219970703125, 3.65576171875, 3.8895263671875, 4.123291015625, 4.3570556640625, 4.5908203125, 4.8245849609375, 5.058349609375, 5.2921142578125, 5.52587890625, 5.7596435546875, 5.993408203125, 6.2271728515625, 6.4609375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 9.0, 4.0, 7.0, 13.0, 13.0, 26.0, 34.0, 56.0, 51.0, 86.0, 99.0, 123.0, 169.0, 217.0, 258.0, 313.0, 407.0, 431.0, 389.0, 304.0, 268.0, 181.0, 163.0, 126.0, 69.0, 63.0, 55.0, 34.0, 28.0, 21.0, 14.0, 15.0, 8.0, 9.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.34375, -11.9735107421875, -11.603271484375, -11.2330322265625, -10.86279296875, -10.4925537109375, -10.122314453125, -9.7520751953125, -9.3818359375, -9.0115966796875, -8.641357421875, -8.2711181640625, -7.90087890625, -7.5306396484375, -7.160400390625, -6.7901611328125, -6.419921875, -6.0496826171875, -5.679443359375, -5.3092041015625, -4.93896484375, -4.5687255859375, -4.198486328125, -3.8282470703125, -3.4580078125, -3.0877685546875, -2.717529296875, -2.3472900390625, -1.97705078125, -1.6068115234375, -1.236572265625, -0.8663330078125, -0.49609375, -0.1258544921875, 0.244384765625, 0.6146240234375, 0.98486328125, 1.3551025390625, 1.725341796875, 2.0955810546875, 2.4658203125, 2.8360595703125, 3.206298828125, 3.5765380859375, 3.94677734375, 4.3170166015625, 4.687255859375, 5.0574951171875, 5.427734375, 5.7979736328125, 6.168212890625, 6.5384521484375, 6.90869140625, 7.2789306640625, 7.649169921875, 8.0194091796875, 8.3896484375, 8.7598876953125, 9.130126953125, 9.5003662109375, 9.87060546875, 10.2408447265625, 10.611083984375, 10.9813232421875, 11.3515625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 5.0, 5.0, 3.0, 6.0, 11.0, 16.0, 15.0, 19.0, 45.0, 41.0, 47.0, 69.0, 102.0, 208.0, 328.0, 659.0, 5798.0, 2516190.0, 1664520.0, 4604.0, 691.0, 316.0, 192.0, 97.0, 73.0, 57.0, 41.0, 41.0, 22.0, 20.0, 11.0, 13.0, 5.0, 6.0, 5.0, 1.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.96875, -34.25341796875, -32.5380859375, -30.82275390625, -29.107421875, -27.39208984375, -25.6767578125, -23.96142578125, -22.24609375, -20.53076171875, -18.8154296875, -17.10009765625, -15.384765625, -13.66943359375, -11.9541015625, -10.23876953125, -8.5234375, -6.80810546875, -5.0927734375, -3.37744140625, -1.662109375, 0.05322265625, 1.7685546875, 3.48388671875, 5.19921875, 6.91455078125, 8.6298828125, 10.34521484375, 12.060546875, 13.77587890625, 15.4912109375, 17.20654296875, 18.921875, 20.63720703125, 22.3525390625, 24.06787109375, 25.783203125, 27.49853515625, 29.2138671875, 30.92919921875, 32.64453125, 34.35986328125, 36.0751953125, 37.79052734375, 39.505859375, 41.22119140625, 42.9365234375, 44.65185546875, 46.3671875, 48.08251953125, 49.7978515625, 51.51318359375, 53.228515625, 54.94384765625, 56.6591796875, 58.37451171875, 60.08984375, 61.80517578125, 63.5205078125, 65.23583984375, 66.951171875, 68.66650390625, 70.3818359375, 72.09716796875, 73.8125]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 17.0, 45.0, 85.0, 140.0, 173.0, 198.0, 158.0, 102.0, 50.0, 23.0, 10.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-83.11483001708984, -80.53240203857422, -77.9499740600586, -75.36753845214844, -72.78511047363281, -70.20268249511719, -67.62025451660156, -65.03782653808594, -62.45539855957031, -59.87297058105469, -57.2905387878418, -54.70811080932617, -52.12568283081055, -49.543251037597656, -46.96082305908203, -44.378395080566406, -41.795963287353516, -39.21353530883789, -36.631103515625, -34.048675537109375, -31.46624755859375, -28.883817672729492, -26.301387786865234, -23.71895980834961, -21.13652992248535, -18.554100036621094, -15.971672058105469, -13.389242172241211, -10.80681324005127, -8.224384307861328, -5.64195442199707, -3.0595264434814453, -0.4770965576171875, 2.105332612991333, 4.6877617835998535, 7.270191192626953, 9.852620124816895, 12.435049057006836, 15.017478942871094, 17.59990692138672, 20.182336807250977, 22.764766693115234, 25.34719467163086, 27.929624557495117, 30.512054443359375, 33.094482421875, 35.676910400390625, 38.25933837890625, 40.84177017211914, 43.424198150634766, 46.006629943847656, 48.58905792236328, 51.171485900878906, 53.75391387939453, 56.33634567260742, 58.91877365112305, 61.50120544433594, 64.08363342285156, 66.66606140136719, 69.24848937988281, 71.83092498779297, 74.4133529663086, 76.99578094482422, 79.57820892333984, 82.16063690185547]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 8.0, 3.0, 3.0, 3.0, 9.0, 9.0, 16.0, 16.0, 19.0, 19.0, 18.0, 27.0, 28.0, 35.0, 39.0, 37.0, 38.0, 33.0, 41.0, 36.0, 39.0, 43.0, 45.0, 36.0, 37.0, 45.0, 38.0, 32.0, 43.0, 32.0, 29.0, 23.0, 31.0, 22.0, 8.0, 15.0, 6.0, 14.0, 4.0, 4.0, 10.0, 7.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-47.71888732910156, -46.35163116455078, -44.984375, -43.61711883544922, -42.24986267089844, -40.882606506347656, -39.515350341796875, -38.148094177246094, -36.78083801269531, -35.41358184814453, -34.04632568359375, -32.67906951904297, -31.311813354492188, -29.944557189941406, -28.577299118041992, -27.21004295349121, -25.842784881591797, -24.475528717041016, -23.108272552490234, -21.741016387939453, -20.373760223388672, -19.00650405883789, -17.639245986938477, -16.271989822387695, -14.904733657836914, -13.537477493286133, -12.170221328735352, -10.802964210510254, -9.435708045959473, -8.068451881408691, -6.701194763183594, -5.3339385986328125, -3.9666824340820312, -2.599426031112671, -1.2321696281433105, 0.1350870132446289, 1.5023431777954102, 2.8695993423461914, 4.236856460571289, 5.60411262512207, 6.971368789672852, 8.338624954223633, 9.705881118774414, 11.073138236999512, 12.440394401550293, 13.807650566101074, 15.174907684326172, 16.542163848876953, 17.909420013427734, 19.276676177978516, 20.643932342529297, 22.011188507080078, 23.37844467163086, 24.74570083618164, 26.112958908081055, 27.480215072631836, 28.847471237182617, 30.2147274017334, 31.58198356628418, 32.949241638183594, 34.316497802734375, 35.683753967285156, 37.05101013183594, 38.41826629638672, 39.7855224609375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 8.0, 10.0, 9.0, 14.0, 20.0, 11.0, 17.0, 23.0, 20.0, 20.0, 22.0, 33.0, 31.0, 33.0, 30.0, 50.0, 36.0, 40.0, 36.0, 44.0, 46.0, 35.0, 39.0, 19.0, 40.0, 36.0, 33.0, 25.0, 21.0, 24.0, 18.0, 25.0, 27.0, 19.0, 9.0, 14.0, 16.0, 4.0, 11.0, 10.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.140625, -4.98822021484375, -4.8358154296875, -4.68341064453125, -4.531005859375, -4.37860107421875, -4.2261962890625, -4.07379150390625, -3.92138671875, -3.76898193359375, -3.6165771484375, -3.46417236328125, -3.311767578125, -3.15936279296875, -3.0069580078125, -2.85455322265625, -2.7021484375, -2.54974365234375, -2.3973388671875, -2.24493408203125, -2.092529296875, -1.94012451171875, -1.7877197265625, -1.63531494140625, -1.48291015625, -1.33050537109375, -1.1781005859375, -1.02569580078125, -0.873291015625, -0.72088623046875, -0.5684814453125, -0.41607666015625, -0.263671875, -0.11126708984375, 0.0411376953125, 0.19354248046875, 0.345947265625, 0.49835205078125, 0.6507568359375, 0.80316162109375, 0.95556640625, 1.10797119140625, 1.2603759765625, 1.41278076171875, 1.565185546875, 1.71759033203125, 1.8699951171875, 2.02239990234375, 2.1748046875, 2.32720947265625, 2.4796142578125, 2.63201904296875, 2.784423828125, 2.93682861328125, 3.0892333984375, 3.24163818359375, 3.39404296875, 3.54644775390625, 3.6988525390625, 3.85125732421875, 4.003662109375, 4.15606689453125, 4.3084716796875, 4.46087646484375, 4.61328125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 4.0, 12.0, 11.0, 17.0, 20.0, 24.0, 61.0, 100.0, 121.0, 191.0, 258.0, 387.0, 536.0, 791.0, 1058.0, 1452.0, 2111.0, 2852.0, 3844.0, 5448.0, 7312.0, 9868.0, 14103.0, 19425.0, 27614.0, 39804.0, 58769.0, 92346.0, 173230.0, 238090.0, 118152.0, 70556.0, 46805.0, 32254.0, 22742.0, 16148.0, 11412.0, 8411.0, 6205.0, 4616.0, 3149.0, 2288.0, 1763.0, 1238.0, 927.0, 668.0, 429.0, 291.0, 205.0, 151.0, 105.0, 54.0, 54.0, 38.0, 17.0, 16.0, 7.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.73291015625, -0.7086563110351562, -0.6844024658203125, -0.6601486206054688, -0.635894775390625, -0.6116409301757812, -0.5873870849609375, -0.5631332397460938, -0.53887939453125, -0.5146255493164062, -0.4903717041015625, -0.46611785888671875, -0.441864013671875, -0.41761016845703125, -0.3933563232421875, -0.36910247802734375, -0.3448486328125, -0.32059478759765625, -0.2963409423828125, -0.27208709716796875, -0.247833251953125, -0.22357940673828125, -0.1993255615234375, -0.17507171630859375, -0.15081787109375, -0.12656402587890625, -0.1023101806640625, -0.07805633544921875, -0.053802490234375, -0.02954864501953125, -0.0052947998046875, 0.01895904541015625, 0.043212890625, 0.06746673583984375, 0.0917205810546875, 0.11597442626953125, 0.140228271484375, 0.16448211669921875, 0.1887359619140625, 0.21298980712890625, 0.23724365234375, 0.26149749755859375, 0.2857513427734375, 0.31000518798828125, 0.334259033203125, 0.35851287841796875, 0.3827667236328125, 0.40702056884765625, 0.4312744140625, 0.45552825927734375, 0.4797821044921875, 0.5040359497070312, 0.528289794921875, 0.5525436401367188, 0.5767974853515625, 0.6010513305664062, 0.62530517578125, 0.6495590209960938, 0.6738128662109375, 0.6980667114257812, 0.722320556640625, 0.7465744018554688, 0.7708282470703125, 0.7950820922851562, 0.8193359375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 6.0, 0.0, 3.0, 5.0, 3.0, 9.0, 5.0, 5.0, 5.0, 5.0, 8.0, 5.0, 16.0, 16.0, 12.0, 11.0, 25.0, 24.0, 22.0, 19.0, 27.0, 32.0, 34.0, 31.0, 35.0, 48.0, 46.0, 34.0, 1065.0, 29.0, 34.0, 26.0, 39.0, 31.0, 36.0, 38.0, 35.0, 30.0, 28.0, 28.0, 27.0, 18.0, 9.0, 13.0, 12.0, 5.0, 12.0, 6.0, 8.0, 7.0, 3.0, 2.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.052734375, -2.958404541015625, -2.86407470703125, -2.769744873046875, -2.6754150390625, -2.581085205078125, -2.48675537109375, -2.392425537109375, -2.298095703125, -2.203765869140625, -2.10943603515625, -2.015106201171875, -1.9207763671875, -1.826446533203125, -1.73211669921875, -1.637786865234375, -1.54345703125, -1.449127197265625, -1.35479736328125, -1.260467529296875, -1.1661376953125, -1.071807861328125, -0.97747802734375, -0.883148193359375, -0.788818359375, -0.694488525390625, -0.60015869140625, -0.505828857421875, -0.4114990234375, -0.317169189453125, -0.22283935546875, -0.128509521484375, -0.0341796875, 0.060150146484375, 0.15447998046875, 0.248809814453125, 0.3431396484375, 0.437469482421875, 0.53179931640625, 0.626129150390625, 0.720458984375, 0.814788818359375, 0.90911865234375, 1.003448486328125, 1.0977783203125, 1.192108154296875, 1.28643798828125, 1.380767822265625, 1.47509765625, 1.569427490234375, 1.66375732421875, 1.758087158203125, 1.8524169921875, 1.946746826171875, 2.04107666015625, 2.135406494140625, 2.229736328125, 2.324066162109375, 2.41839599609375, 2.512725830078125, 2.6070556640625, 2.701385498046875, 2.79571533203125, 2.890045166015625, 2.984375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 4.0, 2.0, 12.0, 4.0, 15.0, 12.0, 16.0, 24.0, 52.0, 85.0, 164.0, 283.0, 476.0, 845.0, 1372.0, 2372.0, 4251.0, 7870.0, 14374.0, 27120.0, 54992.0, 119839.0, 1427172.0, 251072.0, 91951.0, 43858.0, 22283.0, 11871.0, 6485.0, 3465.0, 2069.0, 1146.0, 663.0, 355.0, 241.0, 118.0, 69.0, 39.0, 24.0, 11.0, 11.0, 7.0, 5.0, 6.0, 4.0, 10.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.466796875, -1.4207305908203125, -1.374664306640625, -1.3285980224609375, -1.28253173828125, -1.2364654541015625, -1.190399169921875, -1.1443328857421875, -1.0982666015625, -1.0522003173828125, -1.006134033203125, -0.9600677490234375, -0.91400146484375, -0.8679351806640625, -0.821868896484375, -0.7758026123046875, -0.729736328125, -0.6836700439453125, -0.637603759765625, -0.5915374755859375, -0.54547119140625, -0.4994049072265625, -0.453338623046875, -0.4072723388671875, -0.3612060546875, -0.3151397705078125, -0.269073486328125, -0.2230072021484375, -0.17694091796875, -0.1308746337890625, -0.084808349609375, -0.0387420654296875, 0.00732421875, 0.0533905029296875, 0.099456787109375, 0.1455230712890625, 0.19158935546875, 0.2376556396484375, 0.283721923828125, 0.3297882080078125, 0.3758544921875, 0.4219207763671875, 0.467987060546875, 0.5140533447265625, 0.56011962890625, 0.6061859130859375, 0.652252197265625, 0.6983184814453125, 0.744384765625, 0.7904510498046875, 0.836517333984375, 0.8825836181640625, 0.92864990234375, 0.9747161865234375, 1.020782470703125, 1.0668487548828125, 1.1129150390625, 1.1589813232421875, 1.205047607421875, 1.2511138916015625, 1.29718017578125, 1.3432464599609375, 1.389312744140625, 1.4353790283203125, 1.4814453125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 3.0, 5.0, 3.0, 5.0, 9.0, 10.0, 12.0, 13.0, 23.0, 17.0, 19.0, 16.0, 28.0, 25.0, 29.0, 43.0, 39.0, 45.0, 48.0, 50.0, 62.0, 61.0, 47.0, 46.0, 39.0, 40.0, 27.0, 35.0, 24.0, 21.0, 18.0, 24.0, 12.0, 20.0, 13.0, 10.0, 6.0, 9.0, 6.0, 5.0, 4.0, 7.0, 5.0, 2.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0005092620849609375, -0.0004917755722999573, -0.00047428905963897705, -0.0004568025469779968, -0.0004393160343170166, -0.0004218295216560364, -0.00040434300899505615, -0.00038685649633407593, -0.0003693699836730957, -0.0003518834710121155, -0.00033439695835113525, -0.00031691044569015503, -0.0002994239330291748, -0.0002819374203681946, -0.00026445090770721436, -0.00024696439504623413, -0.0002294778823852539, -0.00021199136972427368, -0.00019450485706329346, -0.00017701834440231323, -0.000159531831741333, -0.00014204531908035278, -0.00012455880641937256, -0.00010707229375839233, -8.958578109741211e-05, -7.209926843643188e-05, -5.461275577545166e-05, -3.7126243114471436e-05, -1.963973045349121e-05, -2.1532177925109863e-06, 1.5333294868469238e-05, 3.281980752944946e-05, 5.030632019042969e-05, 6.779283285140991e-05, 8.527934551239014e-05, 0.00010276585817337036, 0.00012025237083435059, 0.0001377388834953308, 0.00015522539615631104, 0.00017271190881729126, 0.00019019842147827148, 0.0002076849341392517, 0.00022517144680023193, 0.00024265795946121216, 0.0002601444721221924, 0.0002776309847831726, 0.00029511749744415283, 0.00031260401010513306, 0.0003300905227661133, 0.0003475770354270935, 0.00036506354808807373, 0.00038255006074905396, 0.0004000365734100342, 0.0004175230860710144, 0.00043500959873199463, 0.00045249611139297485, 0.0004699826240539551, 0.0004874691367149353, 0.0005049556493759155, 0.0005224421620368958, 0.000539928674697876, 0.0005574151873588562, 0.0005749017000198364, 0.0005923882126808167, 0.0006098747253417969]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 4.0, 4.0, 1.0, 6.0, 2.0, 9.0, 12.0, 7.0, 12.0, 19.0, 15.0, 25.0, 24.0, 45.0, 48.0, 76.0, 102.0, 117.0, 161.0, 263.0, 495.0, 1271.0, 110113.0, 929952.0, 3960.0, 664.0, 337.0, 224.0, 144.0, 101.0, 92.0, 58.0, 49.0, 40.0, 24.0, 23.0, 11.0, 9.0, 10.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.01175689697265625, -0.0113677978515625, -0.01097869873046875, -0.010589599609375, -0.01020050048828125, -0.0098114013671875, -0.00942230224609375, -0.009033203125, -0.00864410400390625, -0.0082550048828125, -0.00786590576171875, -0.007476806640625, -0.00708770751953125, -0.0066986083984375, -0.00630950927734375, -0.00592041015625, -0.00553131103515625, -0.0051422119140625, -0.00475311279296875, -0.004364013671875, -0.00397491455078125, -0.0035858154296875, -0.00319671630859375, -0.0028076171875, -0.00241851806640625, -0.0020294189453125, -0.00164031982421875, -0.001251220703125, -0.00086212158203125, -0.0004730224609375, -8.392333984375e-05, 0.00030517578125, 0.00069427490234375, 0.0010833740234375, 0.00147247314453125, 0.001861572265625, 0.00225067138671875, 0.0026397705078125, 0.00302886962890625, 0.00341796875, 0.00380706787109375, 0.0041961669921875, 0.00458526611328125, 0.004974365234375, 0.00536346435546875, 0.0057525634765625, 0.00614166259765625, 0.00653076171875, 0.00691986083984375, 0.0073089599609375, 0.00769805908203125, 0.008087158203125, 0.00847625732421875, 0.0088653564453125, 0.00925445556640625, 0.0096435546875, 0.01003265380859375, 0.0104217529296875, 0.01081085205078125, 0.011199951171875, 0.01158905029296875, 0.0119781494140625, 0.01236724853515625, 0.01275634765625, 0.01314544677734375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 14.0, 162.0, 511.0, 283.0, 42.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011940239928662777, -0.0011333228321745992, -0.0010726216714829206, -0.001011920627206564, -0.0009512194083072245, -0.0008905183058232069, -0.0008298171451315284, -0.0007691159844398499, -0.0007084148237481713, -0.0006477136630564928, -0.0005870125605724752, -0.0005263113998807967, -0.00046561023918911815, -0.0004049091076012701, -0.000344207976013422, -0.0002835068153217435, -0.00022280571283772588, -0.00016210456669796258, -0.0001014034278341569, -4.070228897035122e-05, 1.9998857169412076e-05, 8.070000330917537e-05, 0.00014140113489702344, 0.00020210229558870196, 0.00026280342717655003, 0.0003235045587643981, 0.0003842057194560766, 0.0004449068510439247, 0.0005056079826317728, 0.0005663091433234513, 0.0006270102458074689, 0.0006877114064991474, 0.0007484125671908259, 0.0008091137278825045, 0.0008698148303665221, 0.0009305159910582006, 0.0009912170935422182, 0.0010519182542338967, 0.0011126194149255753, 0.0011733205756172538, 0.0012340217363089323, 0.0012947228970006108, 0.0013554240576922894, 0.001416125101968646, 0.0014768262626603246, 0.001537527423352003, 0.0015982285840436816, 0.0016589297447353601, 0.0017196307890117168, 0.0017803319497033954, 0.0018410331103950739, 0.0019017341546714306, 0.001962435431778431, 0.0020231364760547876, 0.0020838375203311443, 0.0021445387974381447, 0.002205240074545145, 0.0022659411188215017, 0.002326642395928502, 0.0023873434402048588, 0.002448044717311859, 0.002508745761588216, 0.0025694468058645725, 0.002630148082971573, 0.0026908491272479296]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 8.0, 12.0, 11.0, 9.0, 11.0, 24.0, 15.0, 16.0, 15.0, 25.0, 39.0, 38.0, 35.0, 32.0, 54.0, 38.0, 38.0, 38.0, 44.0, 40.0, 41.0, 43.0, 35.0, 52.0, 33.0, 31.0, 25.0, 29.0, 29.0, 18.0, 17.0, 25.0, 21.0, 10.0, 10.0, 4.0, 11.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0003700852394104004, -0.0003587193787097931, -0.0003473535180091858, -0.0003359876573085785, -0.0003246217966079712, -0.0003132559359073639, -0.0003018900752067566, -0.0002905242145061493, -0.000279158353805542, -0.0002677924931049347, -0.0002564266324043274, -0.0002450607717037201, -0.0002336949110031128, -0.0002223290503025055, -0.0002109631896018982, -0.0001995973289012909, -0.0001882314682006836, -0.0001768656075000763, -0.000165499746799469, -0.0001541338860988617, -0.0001427680253982544, -0.0001314021646976471, -0.0001200363039970398, -0.0001086704432964325, -9.73045825958252e-05, -8.59387218952179e-05, -7.45728611946106e-05, -6.32070004940033e-05, -5.1841139793395996e-05, -4.0475279092788696e-05, -2.9109418392181396e-05, -1.7743557691574097e-05, -6.377696990966797e-06, 4.988163709640503e-06, 1.6354024410247803e-05, 2.7719885110855103e-05, 3.90857458114624e-05, 5.04516065120697e-05, 6.1817467212677e-05, 7.31833279132843e-05, 8.45491886138916e-05, 9.59150493144989e-05, 0.0001072809100151062, 0.0001186467707157135, 0.0001300126314163208, 0.0001413784921169281, 0.0001527443528175354, 0.0001641102135181427, 0.00017547607421875, 0.0001868419349193573, 0.0001982077956199646, 0.0002095736563205719, 0.0002209395170211792, 0.0002323053777217865, 0.0002436712384223938, 0.0002550370991230011, 0.0002664029598236084, 0.0002777688205242157, 0.000289134681224823, 0.0003005005419254303, 0.0003118664026260376, 0.0003232322633266449, 0.0003345981240272522, 0.0003459639847278595, 0.0003573298454284668]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 8.0, 10.0, 9.0, 14.0, 20.0, 11.0, 17.0, 23.0, 20.0, 20.0, 22.0, 33.0, 31.0, 33.0, 30.0, 50.0, 37.0, 39.0, 36.0, 44.0, 46.0, 35.0, 39.0, 19.0, 40.0, 36.0, 33.0, 25.0, 21.0, 24.0, 18.0, 26.0, 26.0, 19.0, 9.0, 14.0, 16.0, 4.0, 11.0, 10.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.140625, -4.98822021484375, -4.8358154296875, -4.68341064453125, -4.531005859375, -4.37860107421875, -4.2261962890625, -4.07379150390625, -3.92138671875, -3.76898193359375, -3.6165771484375, -3.46417236328125, -3.311767578125, -3.15936279296875, -3.0069580078125, -2.85455322265625, -2.7021484375, -2.54974365234375, -2.3973388671875, -2.24493408203125, -2.092529296875, -1.94012451171875, -1.7877197265625, -1.63531494140625, -1.48291015625, -1.33050537109375, -1.1781005859375, -1.02569580078125, -0.873291015625, -0.72088623046875, -0.5684814453125, -0.41607666015625, -0.263671875, -0.11126708984375, 0.0411376953125, 0.19354248046875, 0.345947265625, 0.49835205078125, 0.6507568359375, 0.80316162109375, 0.95556640625, 1.10797119140625, 1.2603759765625, 1.41278076171875, 1.565185546875, 1.71759033203125, 1.8699951171875, 2.02239990234375, 2.1748046875, 2.32720947265625, 2.4796142578125, 2.63201904296875, 2.784423828125, 2.93682861328125, 3.0892333984375, 3.24163818359375, 3.39404296875, 3.54644775390625, 3.6988525390625, 3.85125732421875, 4.003662109375, 4.15606689453125, 4.3084716796875, 4.46087646484375, 4.61328125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 6.0, 7.0, 8.0, 13.0, 20.0, 19.0, 26.0, 42.0, 66.0, 83.0, 125.0, 196.0, 378.0, 641.0, 1177.0, 2267.0, 4722.0, 10122.0, 25047.0, 69792.0, 261003.0, 463921.0, 135896.0, 42618.0, 16178.0, 6967.0, 3298.0, 1695.0, 947.0, 491.0, 271.0, 169.0, 109.0, 69.0, 54.0, 34.0, 18.0, 23.0, 15.0, 7.0, 7.0, 6.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.60546875, -4.467041015625, -4.32861328125, -4.190185546875, -4.0517578125, -3.913330078125, -3.77490234375, -3.636474609375, -3.498046875, -3.359619140625, -3.22119140625, -3.082763671875, -2.9443359375, -2.805908203125, -2.66748046875, -2.529052734375, -2.390625, -2.252197265625, -2.11376953125, -1.975341796875, -1.8369140625, -1.698486328125, -1.56005859375, -1.421630859375, -1.283203125, -1.144775390625, -1.00634765625, -0.867919921875, -0.7294921875, -0.591064453125, -0.45263671875, -0.314208984375, -0.17578125, -0.037353515625, 0.10107421875, 0.239501953125, 0.3779296875, 0.516357421875, 0.65478515625, 0.793212890625, 0.931640625, 1.070068359375, 1.20849609375, 1.346923828125, 1.4853515625, 1.623779296875, 1.76220703125, 1.900634765625, 2.0390625, 2.177490234375, 2.31591796875, 2.454345703125, 2.5927734375, 2.731201171875, 2.86962890625, 3.008056640625, 3.146484375, 3.284912109375, 3.42333984375, 3.561767578125, 3.7001953125, 3.838623046875, 3.97705078125, 4.115478515625, 4.25390625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 3.0, 2.0, 5.0, 6.0, 17.0, 10.0, 13.0, 15.0, 15.0, 27.0, 33.0, 30.0, 41.0, 47.0, 39.0, 48.0, 69.0, 118.0, 425.0, 1526.0, 109.0, 64.0, 44.0, 40.0, 43.0, 45.0, 35.0, 36.0, 27.0, 26.0, 20.0, 12.0, 12.0, 10.0, 8.0, 9.0, 4.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.90625, -17.309814453125, -16.71337890625, -16.116943359375, -15.5205078125, -14.924072265625, -14.32763671875, -13.731201171875, -13.134765625, -12.538330078125, -11.94189453125, -11.345458984375, -10.7490234375, -10.152587890625, -9.55615234375, -8.959716796875, -8.36328125, -7.766845703125, -7.17041015625, -6.573974609375, -5.9775390625, -5.381103515625, -4.78466796875, -4.188232421875, -3.591796875, -2.995361328125, -2.39892578125, -1.802490234375, -1.2060546875, -0.609619140625, -0.01318359375, 0.583251953125, 1.1796875, 1.776123046875, 2.37255859375, 2.968994140625, 3.5654296875, 4.161865234375, 4.75830078125, 5.354736328125, 5.951171875, 6.547607421875, 7.14404296875, 7.740478515625, 8.3369140625, 8.933349609375, 9.52978515625, 10.126220703125, 10.72265625, 11.319091796875, 11.91552734375, 12.511962890625, 13.1083984375, 13.704833984375, 14.30126953125, 14.897705078125, 15.494140625, 16.090576171875, 16.68701171875, 17.283447265625, 17.8798828125, 18.476318359375, 19.07275390625, 19.669189453125, 20.265625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 5.0, 3.0, 15.0, 7.0, 9.0, 11.0, 6.0, 26.0, 19.0, 24.0, 36.0, 42.0, 57.0, 67.0, 94.0, 141.0, 203.0, 328.0, 562.0, 3439.0, 495868.0, 2637591.0, 5402.0, 691.0, 308.0, 202.0, 141.0, 112.0, 63.0, 53.0, 49.0, 24.0, 22.0, 21.0, 13.0, 15.0, 13.0, 11.0, 3.0, 3.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-40.96875, -39.7666015625, -38.564453125, -37.3623046875, -36.16015625, -34.9580078125, -33.755859375, -32.5537109375, -31.3515625, -30.1494140625, -28.947265625, -27.7451171875, -26.54296875, -25.3408203125, -24.138671875, -22.9365234375, -21.734375, -20.5322265625, -19.330078125, -18.1279296875, -16.92578125, -15.7236328125, -14.521484375, -13.3193359375, -12.1171875, -10.9150390625, -9.712890625, -8.5107421875, -7.30859375, -6.1064453125, -4.904296875, -3.7021484375, -2.5, -1.2978515625, -0.095703125, 1.1064453125, 2.30859375, 3.5107421875, 4.712890625, 5.9150390625, 7.1171875, 8.3193359375, 9.521484375, 10.7236328125, 11.92578125, 13.1279296875, 14.330078125, 15.5322265625, 16.734375, 17.9365234375, 19.138671875, 20.3408203125, 21.54296875, 22.7451171875, 23.947265625, 25.1494140625, 26.3515625, 27.5537109375, 28.755859375, 29.9580078125, 31.16015625, 32.3623046875, 33.564453125, 34.7666015625, 35.96875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [714.0, 302.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.803107261657715, 0.6613492965698242, 10.125805854797363, 19.59026336669922, 29.054718017578125, 38.51917266845703, 47.9836311340332, 57.448089599609375, 66.91254425048828, 76.37699890136719, 85.84146118164062, 95.30591583251953, 104.77037048339844, 114.23482513427734, 123.69927978515625, 133.1637420654297, 142.62820434570312, 152.09266662597656, 161.55711364746094, 171.02157592773438, 180.48602294921875, 189.9504852294922, 199.41494750976562, 208.87939453125, 218.34385681152344, 227.80831909179688, 237.27276611328125, 246.7372283935547, 256.2016906738281, 265.6661376953125, 275.1305847167969, 284.5950622558594, 294.05950927734375, 303.5239562988281, 312.9884338378906, 322.452880859375, 331.9173278808594, 341.38177490234375, 350.84625244140625, 360.3106994628906, 369.775146484375, 379.2395935058594, 388.7040710449219, 398.16851806640625, 407.6329650878906, 417.097412109375, 426.5618896484375, 436.0263366699219, 445.4908142089844, 454.95526123046875, 464.41973876953125, 473.8841857910156, 483.3486328125, 492.8131103515625, 502.2775573730469, 511.74200439453125, 521.2064819335938, 530.6709594726562, 540.1353759765625, 549.599853515625, 559.0643310546875, 568.5287475585938, 577.9932250976562, 587.4577026367188, 596.922119140625]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 4.0, 2.0, 6.0, 11.0, 3.0, 8.0, 8.0, 16.0, 10.0, 9.0, 23.0, 19.0, 16.0, 26.0, 21.0, 27.0, 21.0, 29.0, 36.0, 29.0, 48.0, 39.0, 33.0, 41.0, 42.0, 35.0, 41.0, 35.0, 35.0, 39.0, 34.0, 35.0, 36.0, 27.0, 27.0, 24.0, 27.0, 12.0, 9.0, 13.0, 8.0, 11.0, 9.0, 4.0, 3.0, 5.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-42.932701110839844, -41.670677185058594, -40.40865707397461, -39.14663314819336, -37.884613037109375, -36.622589111328125, -35.360565185546875, -34.098541259765625, -32.83652114868164, -31.574499130249023, -30.312477111816406, -29.050453186035156, -27.78843116760254, -26.526409149169922, -25.264385223388672, -24.002363204956055, -22.740341186523438, -21.47831916809082, -20.216297149658203, -18.954273223876953, -17.692251205444336, -16.43022918701172, -15.168206214904785, -13.906183242797852, -12.644161224365234, -11.382139205932617, -10.120116233825684, -8.85809326171875, -7.596071243286133, -6.334048748016357, -5.072026252746582, -3.8100032806396484, -2.5479812622070312, -1.2859587669372559, -0.02393627166748047, 1.238086223602295, 2.5001087188720703, 3.7621312141418457, 5.024153709411621, 6.286176681518555, 7.548198699951172, 8.810220718383789, 10.072243690490723, 11.334266662597656, 12.596288681030273, 13.85831069946289, 15.120333671569824, 16.382356643676758, 17.644378662109375, 18.906400680541992, 20.16842269897461, 21.43044662475586, 22.692468643188477, 23.954490661621094, 25.216514587402344, 26.47853660583496, 27.740558624267578, 29.002580642700195, 30.264602661132812, 31.526626586914062, 32.78865051269531, 34.0506706237793, 35.31269454956055, 36.57471466064453, 37.83673858642578]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 11.0, 8.0, 14.0, 10.0, 17.0, 14.0, 18.0, 19.0, 19.0, 21.0, 27.0, 31.0, 38.0, 40.0, 36.0, 38.0, 49.0, 36.0, 42.0, 43.0, 42.0, 45.0, 28.0, 37.0, 41.0, 29.0, 38.0, 16.0, 31.0, 18.0, 24.0, 24.0, 20.0, 12.0, 14.0, 8.0, 4.0, 11.0, 10.0, 13.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.78515625, -5.62091064453125, -5.4566650390625, -5.29241943359375, -5.128173828125, -4.96392822265625, -4.7996826171875, -4.63543701171875, -4.47119140625, -4.30694580078125, -4.1427001953125, -3.97845458984375, -3.814208984375, -3.64996337890625, -3.4857177734375, -3.32147216796875, -3.1572265625, -2.99298095703125, -2.8287353515625, -2.66448974609375, -2.500244140625, -2.33599853515625, -2.1717529296875, -2.00750732421875, -1.84326171875, -1.67901611328125, -1.5147705078125, -1.35052490234375, -1.186279296875, -1.02203369140625, -0.8577880859375, -0.69354248046875, -0.529296875, -0.36505126953125, -0.2008056640625, -0.03656005859375, 0.127685546875, 0.29193115234375, 0.4561767578125, 0.62042236328125, 0.78466796875, 0.94891357421875, 1.1131591796875, 1.27740478515625, 1.441650390625, 1.60589599609375, 1.7701416015625, 1.93438720703125, 2.0986328125, 2.26287841796875, 2.4271240234375, 2.59136962890625, 2.755615234375, 2.91986083984375, 3.0841064453125, 3.24835205078125, 3.41259765625, 3.57684326171875, 3.7410888671875, 3.90533447265625, 4.069580078125, 4.23382568359375, 4.3980712890625, 4.56231689453125, 4.7265625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 7.0, 5.0, 5.0, 8.0, 10.0, 10.0, 7.0, 17.0, 21.0, 15.0, 16.0, 18.0, 23.0, 42.0, 43.0, 58.0, 111.0, 130.0, 183.0, 476.0, 3497.0, 318155.0, 3811867.0, 56859.0, 1704.0, 363.0, 150.0, 117.0, 75.0, 60.0, 27.0, 33.0, 29.0, 20.0, 16.0, 22.0, 17.0, 12.0, 13.0, 8.0, 11.0, 6.0, 9.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.953125, -31.04931640625, -30.1455078125, -29.24169921875, -28.337890625, -27.43408203125, -26.5302734375, -25.62646484375, -24.72265625, -23.81884765625, -22.9150390625, -22.01123046875, -21.107421875, -20.20361328125, -19.2998046875, -18.39599609375, -17.4921875, -16.58837890625, -15.6845703125, -14.78076171875, -13.876953125, -12.97314453125, -12.0693359375, -11.16552734375, -10.26171875, -9.35791015625, -8.4541015625, -7.55029296875, -6.646484375, -5.74267578125, -4.8388671875, -3.93505859375, -3.03125, -2.12744140625, -1.2236328125, -0.31982421875, 0.583984375, 1.48779296875, 2.3916015625, 3.29541015625, 4.19921875, 5.10302734375, 6.0068359375, 6.91064453125, 7.814453125, 8.71826171875, 9.6220703125, 10.52587890625, 11.4296875, 12.33349609375, 13.2373046875, 14.14111328125, 15.044921875, 15.94873046875, 16.8525390625, 17.75634765625, 18.66015625, 19.56396484375, 20.4677734375, 21.37158203125, 22.275390625, 23.17919921875, 24.0830078125, 24.98681640625, 25.890625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 11.0, 22.0, 20.0, 28.0, 41.0, 57.0, 73.0, 99.0, 144.0, 214.0, 250.0, 360.0, 412.0, 485.0, 434.0, 400.0, 266.0, 202.0, 140.0, 103.0, 82.0, 64.0, 41.0, 40.0, 20.0, 14.0, 11.0, 6.0, 9.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0859375, -12.684326171875, -12.28271484375, -11.881103515625, -11.4794921875, -11.077880859375, -10.67626953125, -10.274658203125, -9.873046875, -9.471435546875, -9.06982421875, -8.668212890625, -8.2666015625, -7.864990234375, -7.46337890625, -7.061767578125, -6.66015625, -6.258544921875, -5.85693359375, -5.455322265625, -5.0537109375, -4.652099609375, -4.25048828125, -3.848876953125, -3.447265625, -3.045654296875, -2.64404296875, -2.242431640625, -1.8408203125, -1.439208984375, -1.03759765625, -0.635986328125, -0.234375, 0.167236328125, 0.56884765625, 0.970458984375, 1.3720703125, 1.773681640625, 2.17529296875, 2.576904296875, 2.978515625, 3.380126953125, 3.78173828125, 4.183349609375, 4.5849609375, 4.986572265625, 5.38818359375, 5.789794921875, 6.19140625, 6.593017578125, 6.99462890625, 7.396240234375, 7.7978515625, 8.199462890625, 8.60107421875, 9.002685546875, 9.404296875, 9.805908203125, 10.20751953125, 10.609130859375, 11.0107421875, 11.412353515625, 11.81396484375, 12.215576171875, 12.6171875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 9.0, 4.0, 12.0, 12.0, 14.0, 19.0, 29.0, 39.0, 54.0, 63.0, 86.0, 95.0, 132.0, 154.0, 216.0, 378.0, 713.0, 2980.0, 105251.0, 3977485.0, 101494.0, 2959.0, 733.0, 383.0, 252.0, 166.0, 115.0, 75.0, 69.0, 68.0, 46.0, 26.0, 35.0, 31.0, 13.0, 18.0, 16.0, 10.0, 5.0, 5.0, 9.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.96875, -36.587890625, -35.20703125, -33.826171875, -32.4453125, -31.064453125, -29.68359375, -28.302734375, -26.921875, -25.541015625, -24.16015625, -22.779296875, -21.3984375, -20.017578125, -18.63671875, -17.255859375, -15.875, -14.494140625, -13.11328125, -11.732421875, -10.3515625, -8.970703125, -7.58984375, -6.208984375, -4.828125, -3.447265625, -2.06640625, -0.685546875, 0.6953125, 2.076171875, 3.45703125, 4.837890625, 6.21875, 7.599609375, 8.98046875, 10.361328125, 11.7421875, 13.123046875, 14.50390625, 15.884765625, 17.265625, 18.646484375, 20.02734375, 21.408203125, 22.7890625, 24.169921875, 25.55078125, 26.931640625, 28.3125, 29.693359375, 31.07421875, 32.455078125, 33.8359375, 35.216796875, 36.59765625, 37.978515625, 39.359375, 40.740234375, 42.12109375, 43.501953125, 44.8828125, 46.263671875, 47.64453125, 49.025390625, 50.40625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 14.0, 66.0, 216.0, 361.0, 249.0, 84.0, 19.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-223.12876892089844, -217.8889617919922, -212.64915466308594, -207.4093475341797, -202.16954040527344, -196.9297332763672, -191.68992614746094, -186.45013427734375, -181.2103271484375, -175.97052001953125, -170.730712890625, -165.49090576171875, -160.2510986328125, -155.01129150390625, -149.771484375, -144.53167724609375, -139.2918701171875, -134.05206298828125, -128.812255859375, -123.57244873046875, -118.3326416015625, -113.09283447265625, -107.85303497314453, -102.61322784423828, -97.37342071533203, -92.13361358642578, -86.89380645751953, -81.65399932861328, -76.41419982910156, -71.17439270019531, -65.93458557128906, -60.69477844238281, -55.45497131347656, -50.21516418457031, -44.97535705566406, -39.73555374145508, -34.49574661254883, -29.255939483642578, -24.01613426208496, -18.776329040527344, -13.536521911621094, -8.29671573638916, -3.0569095611572266, 2.182896614074707, 7.422702789306641, 12.66250991821289, 17.902315139770508, 23.142120361328125, 28.381927490234375, 33.621734619140625, 38.861541748046875, 44.10134506225586, 49.34115219116211, 54.58095932006836, 59.820762634277344, 65.0605697631836, 70.30037689208984, 75.5401840209961, 80.77999114990234, 86.0197982788086, 91.25959777832031, 96.49940490722656, 101.73921203613281, 106.97901916503906, 112.21882629394531]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 5.0, 3.0, 2.0, 7.0, 11.0, 5.0, 9.0, 13.0, 9.0, 12.0, 11.0, 16.0, 19.0, 24.0, 16.0, 30.0, 38.0, 33.0, 24.0, 25.0, 46.0, 44.0, 36.0, 42.0, 40.0, 26.0, 51.0, 36.0, 44.0, 39.0, 33.0, 35.0, 22.0, 27.0, 18.0, 17.0, 24.0, 14.0, 15.0, 18.0, 14.0, 11.0, 18.0, 6.0, 2.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-37.458343505859375, -36.26607894897461, -35.07381820678711, -33.881553649902344, -32.689292907714844, -31.497028350830078, -30.304765701293945, -29.112503051757812, -27.920238494873047, -26.727975845336914, -25.53571319580078, -24.343448638916016, -23.151185989379883, -21.95892333984375, -20.766660690307617, -19.574398040771484, -18.38213539123535, -17.18987274169922, -15.99760913848877, -14.805346488952637, -13.613082885742188, -12.420820236206055, -11.228557586669922, -10.036293983459473, -8.84403133392334, -7.651768207550049, -6.459505081176758, -5.267242431640625, -4.074979305267334, -2.882716178894043, -1.6904535293579102, -0.49818992614746094, 0.6940727233886719, 1.8863357305526733, 3.078598737716675, 4.270861625671387, 5.463124752044678, 6.655387878417969, 7.847650527954102, 9.03991413116455, 10.232176780700684, 11.424439430236816, 12.616703033447266, 13.808965682983398, 15.001228332519531, 16.193492889404297, 17.385753631591797, 18.578018188476562, 19.770280838012695, 20.962543487548828, 22.15480613708496, 23.347068786621094, 24.53933334350586, 25.731595993041992, 26.923858642578125, 28.11612319946289, 29.30838394165039, 30.500646591186523, 31.692909240722656, 32.88517379760742, 34.07743453979492, 35.26969909667969, 36.46195983886719, 37.65422439575195, 38.84648895263672]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 5.0, 13.0, 11.0, 16.0, 12.0, 9.0, 15.0, 17.0, 17.0, 23.0, 33.0, 29.0, 20.0, 36.0, 38.0, 28.0, 47.0, 38.0, 38.0, 39.0, 42.0, 27.0, 31.0, 38.0, 28.0, 37.0, 35.0, 29.0, 28.0, 25.0, 21.0, 19.0, 21.0, 18.0, 24.0, 17.0, 12.0, 17.0, 12.0, 8.0, 7.0, 8.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.98828125, -4.8350830078125, -4.681884765625, -4.5286865234375, -4.37548828125, -4.2222900390625, -4.069091796875, -3.9158935546875, -3.7626953125, -3.6094970703125, -3.456298828125, -3.3031005859375, -3.14990234375, -2.9967041015625, -2.843505859375, -2.6903076171875, -2.537109375, -2.3839111328125, -2.230712890625, -2.0775146484375, -1.92431640625, -1.7711181640625, -1.617919921875, -1.4647216796875, -1.3115234375, -1.1583251953125, -1.005126953125, -0.8519287109375, -0.69873046875, -0.5455322265625, -0.392333984375, -0.2391357421875, -0.0859375, 0.0672607421875, 0.220458984375, 0.3736572265625, 0.52685546875, 0.6800537109375, 0.833251953125, 0.9864501953125, 1.1396484375, 1.2928466796875, 1.446044921875, 1.5992431640625, 1.75244140625, 1.9056396484375, 2.058837890625, 2.2120361328125, 2.365234375, 2.5184326171875, 2.671630859375, 2.8248291015625, 2.97802734375, 3.1312255859375, 3.284423828125, 3.4376220703125, 3.5908203125, 3.7440185546875, 3.897216796875, 4.0504150390625, 4.20361328125, 4.3568115234375, 4.510009765625, 4.6632080078125, 4.81640625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 8.0, 9.0, 14.0, 14.0, 36.0, 45.0, 54.0, 111.0, 169.0, 220.0, 371.0, 596.0, 1053.0, 1778.0, 2950.0, 5037.0, 8448.0, 14400.0, 23978.0, 43000.0, 80092.0, 177474.0, 368006.0, 154013.0, 72701.0, 39432.0, 22197.0, 13088.0, 7775.0, 4619.0, 2742.0, 1589.0, 949.0, 596.0, 364.0, 208.0, 137.0, 86.0, 60.0, 42.0, 27.0, 27.0, 14.0, 4.0, 11.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.330078125, -1.287750244140625, -1.24542236328125, -1.203094482421875, -1.1607666015625, -1.118438720703125, -1.07611083984375, -1.033782958984375, -0.991455078125, -0.949127197265625, -0.90679931640625, -0.864471435546875, -0.8221435546875, -0.779815673828125, -0.73748779296875, -0.695159912109375, -0.65283203125, -0.610504150390625, -0.56817626953125, -0.525848388671875, -0.4835205078125, -0.441192626953125, -0.39886474609375, -0.356536865234375, -0.314208984375, -0.271881103515625, -0.22955322265625, -0.187225341796875, -0.1448974609375, -0.102569580078125, -0.06024169921875, -0.017913818359375, 0.0244140625, 0.066741943359375, 0.10906982421875, 0.151397705078125, 0.1937255859375, 0.236053466796875, 0.27838134765625, 0.320709228515625, 0.363037109375, 0.405364990234375, 0.44769287109375, 0.490020751953125, 0.5323486328125, 0.574676513671875, 0.61700439453125, 0.659332275390625, 0.70166015625, 0.743988037109375, 0.78631591796875, 0.828643798828125, 0.8709716796875, 0.913299560546875, 0.95562744140625, 0.997955322265625, 1.040283203125, 1.082611083984375, 1.12493896484375, 1.167266845703125, 1.2095947265625, 1.251922607421875, 1.29425048828125, 1.336578369140625, 1.37890625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 6.0, 7.0, 5.0, 8.0, 14.0, 14.0, 14.0, 15.0, 13.0, 23.0, 20.0, 21.0, 34.0, 27.0, 46.0, 36.0, 53.0, 37.0, 48.0, 35.0, 1069.0, 42.0, 37.0, 37.0, 41.0, 44.0, 29.0, 27.0, 27.0, 35.0, 27.0, 21.0, 20.0, 14.0, 17.0, 15.0, 10.0, 11.0, 10.0, 4.0, 5.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.923828125, -2.814971923828125, -2.70611572265625, -2.597259521484375, -2.4884033203125, -2.379547119140625, -2.27069091796875, -2.161834716796875, -2.052978515625, -1.944122314453125, -1.83526611328125, -1.726409912109375, -1.6175537109375, -1.508697509765625, -1.39984130859375, -1.290985107421875, -1.18212890625, -1.073272705078125, -0.96441650390625, -0.855560302734375, -0.7467041015625, -0.637847900390625, -0.52899169921875, -0.420135498046875, -0.311279296875, -0.202423095703125, -0.09356689453125, 0.015289306640625, 0.1241455078125, 0.233001708984375, 0.34185791015625, 0.450714111328125, 0.5595703125, 0.668426513671875, 0.77728271484375, 0.886138916015625, 0.9949951171875, 1.103851318359375, 1.21270751953125, 1.321563720703125, 1.430419921875, 1.539276123046875, 1.64813232421875, 1.756988525390625, 1.8658447265625, 1.974700927734375, 2.08355712890625, 2.192413330078125, 2.30126953125, 2.410125732421875, 2.51898193359375, 2.627838134765625, 2.7366943359375, 2.845550537109375, 2.95440673828125, 3.063262939453125, 3.172119140625, 3.280975341796875, 3.38983154296875, 3.498687744140625, 3.6075439453125, 3.716400146484375, 3.82525634765625, 3.934112548828125, 4.04296875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 2.0, 3.0, 11.0, 5.0, 19.0, 16.0, 21.0, 29.0, 52.0, 96.0, 179.0, 342.0, 600.0, 1163.0, 2200.0, 4091.0, 8067.0, 15790.0, 32175.0, 69029.0, 177491.0, 1499100.0, 161079.0, 64353.0, 30289.0, 14918.0, 7650.0, 3850.0, 2140.0, 1080.0, 556.0, 309.0, 165.0, 88.0, 49.0, 31.0, 25.0, 25.0, 12.0, 7.0, 6.0, 10.0, 3.0, 0.0, 5.0, 3.0, 1.0, 3.0], "bins": [-1.9638671875, -1.91143798828125, -1.8590087890625, -1.80657958984375, -1.754150390625, -1.70172119140625, -1.6492919921875, -1.59686279296875, -1.54443359375, -1.49200439453125, -1.4395751953125, -1.38714599609375, -1.334716796875, -1.28228759765625, -1.2298583984375, -1.17742919921875, -1.125, -1.07257080078125, -1.0201416015625, -0.96771240234375, -0.915283203125, -0.86285400390625, -0.8104248046875, -0.75799560546875, -0.70556640625, -0.65313720703125, -0.6007080078125, -0.54827880859375, -0.495849609375, -0.44342041015625, -0.3909912109375, -0.33856201171875, -0.2861328125, -0.23370361328125, -0.1812744140625, -0.12884521484375, -0.076416015625, -0.02398681640625, 0.0284423828125, 0.08087158203125, 0.13330078125, 0.18572998046875, 0.2381591796875, 0.29058837890625, 0.343017578125, 0.39544677734375, 0.4478759765625, 0.50030517578125, 0.552734375, 0.60516357421875, 0.6575927734375, 0.71002197265625, 0.762451171875, 0.81488037109375, 0.8673095703125, 0.91973876953125, 0.97216796875, 1.02459716796875, 1.0770263671875, 1.12945556640625, 1.181884765625, 1.23431396484375, 1.2867431640625, 1.33917236328125, 1.3916015625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 7.0, 7.0, 9.0, 6.0, 6.0, 20.0, 16.0, 18.0, 17.0, 23.0, 26.0, 32.0, 32.0, 31.0, 59.0, 69.0, 46.0, 74.0, 63.0, 52.0, 63.0, 56.0, 36.0, 32.0, 27.0, 25.0, 24.0, 25.0, 16.0, 11.0, 9.0, 10.0, 4.0, 9.0, 4.0, 7.0, 6.0, 4.0, 2.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0008401870727539062, -0.0008170157670974731, -0.00079384446144104, -0.0007706731557846069, -0.0007475018501281738, -0.0007243305444717407, -0.0007011592388153076, -0.0006779879331588745, -0.0006548166275024414, -0.0006316453218460083, -0.0006084740161895752, -0.0005853027105331421, -0.000562131404876709, -0.0005389600992202759, -0.0005157887935638428, -0.0004926174879074097, -0.00046944618225097656, -0.00044627487659454346, -0.00042310357093811035, -0.00039993226528167725, -0.00037676095962524414, -0.00035358965396881104, -0.00033041834831237793, -0.0003072470426559448, -0.0002840757369995117, -0.0002609044313430786, -0.0002377331256866455, -0.0002145618200302124, -0.0001913905143737793, -0.0001682192087173462, -0.00014504790306091309, -0.00012187659740447998, -9.870529174804688e-05, -7.553398609161377e-05, -5.2362680435180664e-05, -2.919137477874756e-05, -6.020069122314453e-06, 1.7151236534118652e-05, 4.032254219055176e-05, 6.349384784698486e-05, 8.666515350341797e-05, 0.00010983645915985107, 0.00013300776481628418, 0.00015617907047271729, 0.0001793503761291504, 0.0002025216817855835, 0.0002256929874420166, 0.0002488642930984497, 0.0002720355987548828, 0.0002952069044113159, 0.000318378210067749, 0.00034154951572418213, 0.00036472082138061523, 0.00038789212703704834, 0.00041106343269348145, 0.00043423473834991455, 0.00045740604400634766, 0.00048057734966278076, 0.0005037486553192139, 0.000526919960975647, 0.0005500912666320801, 0.0005732625722885132, 0.0005964338779449463, 0.0006196051836013794, 0.0006427764892578125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 2.0, 7.0, 8.0, 6.0, 7.0, 2.0, 11.0, 12.0, 12.0, 16.0, 18.0, 24.0, 47.0, 36.0, 85.0, 74.0, 163.0, 326.0, 779.0, 23358.0, 1018685.0, 3590.0, 581.0, 253.0, 147.0, 81.0, 46.0, 41.0, 29.0, 11.0, 23.0, 21.0, 8.0, 7.0, 4.0, 7.0, 8.0, 3.0, 2.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.01528167724609375, -0.014722943305969238, -0.014164209365844727, -0.013605475425720215, -0.013046741485595703, -0.012488007545471191, -0.01192927360534668, -0.011370539665222168, -0.010811805725097656, -0.010253071784973145, -0.009694337844848633, -0.009135603904724121, -0.00857686996459961, -0.008018136024475098, -0.007459402084350586, -0.006900668144226074, -0.0063419342041015625, -0.005783200263977051, -0.005224466323852539, -0.004665732383728027, -0.004106998443603516, -0.003548264503479004, -0.002989530563354492, -0.0024307966232299805, -0.0018720626831054688, -0.001313328742980957, -0.0007545948028564453, -0.0001958608627319336, 0.0003628730773925781, 0.0009216070175170898, 0.0014803409576416016, 0.0020390748977661133, 0.002597808837890625, 0.0031565427780151367, 0.0037152767181396484, 0.00427401065826416, 0.004832744598388672, 0.005391478538513184, 0.005950212478637695, 0.006508946418762207, 0.007067680358886719, 0.0076264142990112305, 0.008185148239135742, 0.008743882179260254, 0.009302616119384766, 0.009861350059509277, 0.010420083999633789, 0.0109788179397583, 0.011537551879882812, 0.012096285820007324, 0.012655019760131836, 0.013213753700256348, 0.01377248764038086, 0.014331221580505371, 0.014889955520629883, 0.015448689460754395, 0.016007423400878906, 0.016566157341003418, 0.01712489128112793, 0.01768362522125244, 0.018242359161376953, 0.018801093101501465, 0.019359827041625977, 0.01991856098175049, 0.020477294921875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 8.0, 28.0, 60.0, 111.0, 181.0, 223.0, 204.0, 111.0, 56.0, 19.0, 8.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0013808677904307842, -0.00135238585062325, -0.0013239039108157158, -0.0012954219710081816, -0.0012669400312006474, -0.0012384579749777913, -0.001209976035170257, -0.0011814940953627229, -0.0011530121555551887, -0.0011245302157476544, -0.0010960482759401202, -0.001067566336132586, -0.00103908427990973, -0.0010106023401021957, -0.0009821204002946615, -0.0009536384604871273, -0.0009251565206795931, -0.0008966745808720589, -0.0008681926410645247, -0.0008397106430493295, -0.0008112287032417953, -0.0007827467634342611, -0.000754264765419066, -0.0007257828256115317, -0.0006973008858039975, -0.0006688189459964633, -0.0006403370061889291, -0.000611855008173734, -0.0005833730683661997, -0.0005548911285586655, -0.0005264091305434704, -0.0004979271907359362, -0.00046944530913606286, -0.00044096336932852864, -0.00041248140041716397, -0.0003839994315057993, -0.0003555174916982651, -0.00032703555189073086, -0.0002985535829793662, -0.0002700716140680015, -0.0002415896742604673, -0.00021310771990101784, -0.0001846257655415684, -0.00015614381118211895, -0.0001276618568226695, -9.917990246322006e-05, -7.069794810377061e-05, -4.221599374432117e-05, -1.3734039384871721e-05, 1.4747914974577725e-05, 4.322986933402717e-05, 7.171182369347662e-05, 0.00010019377805292606, 0.0001286757324123755, 0.00015715768677182496, 0.0001856396411312744, 0.00021412159549072385, 0.0002426035498501733, 0.00027108550420962274, 0.0002995674731209874, 0.00032804941292852163, 0.00035653135273605585, 0.0003850133216474205, 0.0004134952905587852, 0.0004419772303663194]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 4.0, 7.0, 7.0, 8.0, 11.0, 12.0, 12.0, 14.0, 15.0, 16.0, 22.0, 27.0, 33.0, 25.0, 27.0, 29.0, 36.0, 37.0, 40.0, 40.0, 51.0, 39.0, 36.0, 30.0, 48.0, 44.0, 41.0, 31.0, 20.0, 29.0, 25.0, 30.0, 21.0, 15.0, 20.0, 15.0, 13.0, 16.0, 12.0, 9.0, 4.0, 6.0, 7.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00038677453994750977, -0.0003746272996068001, -0.0003624800592660904, -0.0003503328189253807, -0.000338185578584671, -0.00032603833824396133, -0.00031389109790325165, -0.00030174385756254196, -0.0002895966172218323, -0.0002774493768811226, -0.0002653021365404129, -0.0002531548961997032, -0.00024100765585899353, -0.00022886041551828384, -0.00021671317517757416, -0.00020456593483686447, -0.00019241869449615479, -0.0001802714541554451, -0.0001681242138147354, -0.00015597697347402573, -0.00014382973313331604, -0.00013168249279260635, -0.00011953525245189667, -0.00010738801211118698, -9.52407717704773e-05, -8.309353142976761e-05, -7.094629108905792e-05, -5.8799050748348236e-05, -4.665181040763855e-05, -3.4504570066928864e-05, -2.2357329726219177e-05, -1.0210089385509491e-05, 1.9371509552001953e-06, 1.4084391295909882e-05, 2.6231631636619568e-05, 3.8378871977329254e-05, 5.052611231803894e-05, 6.267335265874863e-05, 7.482059299945831e-05, 8.6967833340168e-05, 9.911507368087769e-05, 0.00011126231402158737, 0.00012340955436229706, 0.00013555679470300674, 0.00014770403504371643, 0.00015985127538442612, 0.0001719985157251358, 0.0001841457560658455, 0.00019629299640655518, 0.00020844023674726486, 0.00022058747708797455, 0.00023273471742868423, 0.0002448819577693939, 0.0002570291981101036, 0.0002691764384508133, 0.000281323678791523, 0.00029347091913223267, 0.00030561815947294235, 0.00031776539981365204, 0.0003299126401543617, 0.0003420598804950714, 0.0003542071208357811, 0.0003663543611764908, 0.00037850160151720047, 0.00039064884185791016]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 5.0, 13.0, 11.0, 16.0, 12.0, 9.0, 15.0, 17.0, 17.0, 23.0, 33.0, 29.0, 20.0, 36.0, 38.0, 28.0, 47.0, 38.0, 38.0, 39.0, 42.0, 27.0, 31.0, 38.0, 28.0, 37.0, 35.0, 29.0, 28.0, 25.0, 21.0, 19.0, 21.0, 18.0, 24.0, 17.0, 12.0, 17.0, 12.0, 8.0, 7.0, 8.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.98828125, -4.8350830078125, -4.681884765625, -4.5286865234375, -4.37548828125, -4.2222900390625, -4.069091796875, -3.9158935546875, -3.7626953125, -3.6094970703125, -3.456298828125, -3.3031005859375, -3.14990234375, -2.9967041015625, -2.843505859375, -2.6903076171875, -2.537109375, -2.3839111328125, -2.230712890625, -2.0775146484375, -1.92431640625, -1.7711181640625, -1.617919921875, -1.4647216796875, -1.3115234375, -1.1583251953125, -1.005126953125, -0.8519287109375, -0.69873046875, -0.5455322265625, -0.392333984375, -0.2391357421875, -0.0859375, 0.0672607421875, 0.220458984375, 0.3736572265625, 0.52685546875, 0.6800537109375, 0.833251953125, 0.9864501953125, 1.1396484375, 1.2928466796875, 1.446044921875, 1.5992431640625, 1.75244140625, 1.9056396484375, 2.058837890625, 2.2120361328125, 2.365234375, 2.5184326171875, 2.671630859375, 2.8248291015625, 2.97802734375, 3.1312255859375, 3.284423828125, 3.4376220703125, 3.5908203125, 3.7440185546875, 3.897216796875, 4.0504150390625, 4.20361328125, 4.3568115234375, 4.510009765625, 4.6632080078125, 4.81640625]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 8.0, 6.0, 16.0, 15.0, 33.0, 28.0, 46.0, 77.0, 109.0, 154.0, 244.0, 385.0, 631.0, 937.0, 1587.0, 2454.0, 4056.0, 6880.0, 12796.0, 24925.0, 54196.0, 124172.0, 304811.0, 288160.0, 117130.0, 51378.0, 24084.0, 12126.0, 6707.0, 3919.0, 2362.0, 1500.0, 909.0, 547.0, 385.0, 265.0, 164.0, 95.0, 82.0, 64.0, 30.0, 18.0, 16.0, 17.0, 6.0, 6.0, 5.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.880859375, -2.790740966796875, -2.70062255859375, -2.610504150390625, -2.5203857421875, -2.430267333984375, -2.34014892578125, -2.250030517578125, -2.159912109375, -2.069793701171875, -1.97967529296875, -1.889556884765625, -1.7994384765625, -1.709320068359375, -1.61920166015625, -1.529083251953125, -1.43896484375, -1.348846435546875, -1.25872802734375, -1.168609619140625, -1.0784912109375, -0.988372802734375, -0.89825439453125, -0.808135986328125, -0.718017578125, -0.627899169921875, -0.53778076171875, -0.447662353515625, -0.3575439453125, -0.267425537109375, -0.17730712890625, -0.087188720703125, 0.0029296875, 0.093048095703125, 0.18316650390625, 0.273284912109375, 0.3634033203125, 0.453521728515625, 0.54364013671875, 0.633758544921875, 0.723876953125, 0.813995361328125, 0.90411376953125, 0.994232177734375, 1.0843505859375, 1.174468994140625, 1.26458740234375, 1.354705810546875, 1.44482421875, 1.534942626953125, 1.62506103515625, 1.715179443359375, 1.8052978515625, 1.895416259765625, 1.98553466796875, 2.075653076171875, 2.165771484375, 2.255889892578125, 2.34600830078125, 2.436126708984375, 2.5262451171875, 2.616363525390625, 2.70648193359375, 2.796600341796875, 2.88671875]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 3.0, 3.0, 7.0, 6.0, 8.0, 11.0, 12.0, 18.0, 24.0, 16.0, 22.0, 31.0, 38.0, 38.0, 45.0, 48.0, 48.0, 63.0, 96.0, 242.0, 1625.0, 180.0, 64.0, 58.0, 40.0, 46.0, 34.0, 36.0, 29.0, 27.0, 18.0, 15.0, 26.0, 18.0, 18.0, 2.0, 7.0, 2.0, 6.0, 2.0, 7.0, 4.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.203125, -19.57861328125, -18.9541015625, -18.32958984375, -17.705078125, -17.08056640625, -16.4560546875, -15.83154296875, -15.20703125, -14.58251953125, -13.9580078125, -13.33349609375, -12.708984375, -12.08447265625, -11.4599609375, -10.83544921875, -10.2109375, -9.58642578125, -8.9619140625, -8.33740234375, -7.712890625, -7.08837890625, -6.4638671875, -5.83935546875, -5.21484375, -4.59033203125, -3.9658203125, -3.34130859375, -2.716796875, -2.09228515625, -1.4677734375, -0.84326171875, -0.21875, 0.40576171875, 1.0302734375, 1.65478515625, 2.279296875, 2.90380859375, 3.5283203125, 4.15283203125, 4.77734375, 5.40185546875, 6.0263671875, 6.65087890625, 7.275390625, 7.89990234375, 8.5244140625, 9.14892578125, 9.7734375, 10.39794921875, 11.0224609375, 11.64697265625, 12.271484375, 12.89599609375, 13.5205078125, 14.14501953125, 14.76953125, 15.39404296875, 16.0185546875, 16.64306640625, 17.267578125, 17.89208984375, 18.5166015625, 19.14111328125, 19.765625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 4.0, 3.0, 6.0, 7.0, 14.0, 15.0, 24.0, 37.0, 58.0, 81.0, 138.0, 232.0, 442.0, 1671.0, 1292932.0, 1847169.0, 1720.0, 484.0, 262.0, 156.0, 68.0, 57.0, 42.0, 28.0, 13.0, 15.0, 12.0, 6.0, 4.0, 5.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.28125, -55.07861328125, -52.8759765625, -50.67333984375, -48.470703125, -46.26806640625, -44.0654296875, -41.86279296875, -39.66015625, -37.45751953125, -35.2548828125, -33.05224609375, -30.849609375, -28.64697265625, -26.4443359375, -24.24169921875, -22.0390625, -19.83642578125, -17.6337890625, -15.43115234375, -13.228515625, -11.02587890625, -8.8232421875, -6.62060546875, -4.41796875, -2.21533203125, -0.0126953125, 2.18994140625, 4.392578125, 6.59521484375, 8.7978515625, 11.00048828125, 13.203125, 15.40576171875, 17.6083984375, 19.81103515625, 22.013671875, 24.21630859375, 26.4189453125, 28.62158203125, 30.82421875, 33.02685546875, 35.2294921875, 37.43212890625, 39.634765625, 41.83740234375, 44.0400390625, 46.24267578125, 48.4453125, 50.64794921875, 52.8505859375, 55.05322265625, 57.255859375, 59.45849609375, 61.6611328125, 63.86376953125, 66.06640625, 68.26904296875, 70.4716796875, 72.67431640625, 74.876953125, 77.07958984375, 79.2822265625, 81.48486328125, 83.6875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 9.0, 6.0, 11.0, 25.0, 25.0, 50.0, 76.0, 82.0, 93.0, 105.0, 111.0, 89.0, 80.0, 74.0, 55.0, 39.0, 22.0, 21.0, 8.0, 8.0, 6.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.651729583740234, -9.11793041229248, -8.58413028717041, -8.050331115722656, -7.516531467437744, -6.982731819152832, -6.448932647705078, -5.915132999420166, -5.381333351135254, -4.847533702850342, -4.31373405456543, -3.779934883117676, -3.2461352348327637, -2.7123355865478516, -2.1785361766815186, -1.6447367668151855, -1.1109371185302734, -0.5771375894546509, -0.04333806037902832, 0.49046146869659424, 1.0242609977722168, 1.558060646057129, 2.091860055923462, 2.625659465789795, 3.159459114074707, 3.693258762359619, 4.227058410644531, 4.760857582092285, 5.294657230377197, 5.828456878662109, 6.362256050109863, 6.896055698394775, 7.4298553466796875, 7.9636549949646, 8.497454643249512, 9.031253814697266, 9.565053939819336, 10.09885311126709, 10.632652282714844, 11.166452407836914, 11.700251579284668, 12.234050750732422, 12.767850875854492, 13.301650047302246, 13.83544921875, 14.36924934387207, 14.903048515319824, 15.436847686767578, 15.970647811889648, 16.50444793701172, 17.038246154785156, 17.572046279907227, 18.105846405029297, 18.639644622802734, 19.173444747924805, 19.707244873046875, 20.241043090820312, 20.774843215942383, 21.30864143371582, 21.84244155883789, 22.37624168395996, 22.91004180908203, 23.44384002685547, 23.97764015197754, 24.51144027709961]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 6.0, 3.0, 4.0, 7.0, 9.0, 5.0, 11.0, 18.0, 15.0, 16.0, 16.0, 31.0, 22.0, 20.0, 28.0, 44.0, 13.0, 38.0, 32.0, 36.0, 44.0, 44.0, 46.0, 47.0, 43.0, 42.0, 40.0, 52.0, 34.0, 27.0, 28.0, 26.0, 21.0, 26.0, 18.0, 11.0, 15.0, 13.0, 14.0, 8.0, 6.0, 11.0, 2.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.19717788696289, -55.53896713256836, -53.88075637817383, -52.2225456237793, -50.564334869384766, -48.906124114990234, -47.24791717529297, -45.58970642089844, -43.931495666503906, -42.273284912109375, -40.615074157714844, -38.95686340332031, -37.29865264892578, -35.64044189453125, -33.98223114013672, -32.32402038574219, -30.665809631347656, -29.007598876953125, -27.349388122558594, -25.691177368164062, -24.03296661376953, -22.374755859375, -20.7165470123291, -19.05833625793457, -17.40012550354004, -15.741914749145508, -14.083703994750977, -12.425494194030762, -10.76728343963623, -9.1090726852417, -7.450862884521484, -5.792652130126953, -4.134437561035156, -2.476227045059204, -0.818016529083252, 0.8401937484741211, 2.4984045028686523, 4.156615257263184, 5.814825057983398, 7.47303581237793, 9.131246566772461, 10.789457321166992, 12.447668075561523, 14.105877876281738, 15.76408863067627, 17.422298431396484, 19.080509185791016, 20.738719940185547, 22.396930694580078, 24.05514144897461, 25.71335220336914, 27.371562957763672, 29.029773712158203, 30.687984466552734, 32.34619140625, 34.00440216064453, 35.66261291503906, 37.320823669433594, 38.979034423828125, 40.637245178222656, 42.29545593261719, 43.95366668701172, 45.61187744140625, 47.27008819580078, 48.92829895019531]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 5.0, 14.0, 9.0, 10.0, 8.0, 12.0, 18.0, 18.0, 16.0, 16.0, 31.0, 27.0, 28.0, 29.0, 37.0, 37.0, 44.0, 37.0, 47.0, 45.0, 29.0, 46.0, 28.0, 33.0, 37.0, 39.0, 45.0, 18.0, 23.0, 30.0, 17.0, 28.0, 31.0, 14.0, 18.0, 11.0, 13.0, 17.0, 17.0, 9.0, 2.0, 2.0, 1.0, 3.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.51953125, -5.35125732421875, -5.1829833984375, -5.01470947265625, -4.846435546875, -4.67816162109375, -4.5098876953125, -4.34161376953125, -4.17333984375, -4.00506591796875, -3.8367919921875, -3.66851806640625, -3.500244140625, -3.33197021484375, -3.1636962890625, -2.99542236328125, -2.8271484375, -2.65887451171875, -2.4906005859375, -2.32232666015625, -2.154052734375, -1.98577880859375, -1.8175048828125, -1.64923095703125, -1.48095703125, -1.31268310546875, -1.1444091796875, -0.97613525390625, -0.807861328125, -0.63958740234375, -0.4713134765625, -0.30303955078125, -0.134765625, 0.03350830078125, 0.2017822265625, 0.37005615234375, 0.538330078125, 0.70660400390625, 0.8748779296875, 1.04315185546875, 1.21142578125, 1.37969970703125, 1.5479736328125, 1.71624755859375, 1.884521484375, 2.05279541015625, 2.2210693359375, 2.38934326171875, 2.5576171875, 2.72589111328125, 2.8941650390625, 3.06243896484375, 3.230712890625, 3.39898681640625, 3.5672607421875, 3.73553466796875, 3.90380859375, 4.07208251953125, 4.2403564453125, 4.40863037109375, 4.576904296875, 4.74517822265625, 4.9134521484375, 5.08172607421875, 5.25]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 6.0, 5.0, 8.0, 17.0, 17.0, 31.0, 29.0, 49.0, 48.0, 66.0, 117.0, 160.0, 224.0, 379.0, 690.0, 1290.0, 3210.0, 8892.0, 32317.0, 169318.0, 850720.0, 1805007.0, 1042281.0, 219202.0, 41595.0, 10998.0, 3959.0, 1608.0, 776.0, 415.0, 236.0, 159.0, 109.0, 96.0, 69.0, 43.0, 42.0, 17.0, 18.0, 13.0, 18.0, 11.0, 9.0, 7.0, 3.0, 0.0, 2.0, 0.0, 2.0], "bins": [-9.1875, -8.93634033203125, -8.6851806640625, -8.43402099609375, -8.182861328125, -7.93170166015625, -7.6805419921875, -7.42938232421875, -7.17822265625, -6.92706298828125, -6.6759033203125, -6.42474365234375, -6.173583984375, -5.92242431640625, -5.6712646484375, -5.42010498046875, -5.1689453125, -4.91778564453125, -4.6666259765625, -4.41546630859375, -4.164306640625, -3.91314697265625, -3.6619873046875, -3.41082763671875, -3.15966796875, -2.90850830078125, -2.6573486328125, -2.40618896484375, -2.155029296875, -1.90386962890625, -1.6527099609375, -1.40155029296875, -1.150390625, -0.89923095703125, -0.6480712890625, -0.39691162109375, -0.145751953125, 0.10540771484375, 0.3565673828125, 0.60772705078125, 0.85888671875, 1.11004638671875, 1.3612060546875, 1.61236572265625, 1.863525390625, 2.11468505859375, 2.3658447265625, 2.61700439453125, 2.8681640625, 3.11932373046875, 3.3704833984375, 3.62164306640625, 3.872802734375, 4.12396240234375, 4.3751220703125, 4.62628173828125, 4.87744140625, 5.12860107421875, 5.3797607421875, 5.63092041015625, 5.882080078125, 6.13323974609375, 6.3843994140625, 6.63555908203125, 6.88671875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 2.0, 5.0, 8.0, 12.0, 12.0, 21.0, 29.0, 35.0, 31.0, 76.0, 86.0, 108.0, 139.0, 194.0, 215.0, 312.0, 396.0, 390.0, 426.0, 381.0, 307.0, 214.0, 158.0, 132.0, 103.0, 59.0, 65.0, 44.0, 33.0, 25.0, 12.0, 14.0, 8.0, 4.0, 9.0, 3.0, 6.0, 2.0, 3.0, 0.0, 3.0], "bins": [-14.96875, -14.6025390625, -14.236328125, -13.8701171875, -13.50390625, -13.1376953125, -12.771484375, -12.4052734375, -12.0390625, -11.6728515625, -11.306640625, -10.9404296875, -10.57421875, -10.2080078125, -9.841796875, -9.4755859375, -9.109375, -8.7431640625, -8.376953125, -8.0107421875, -7.64453125, -7.2783203125, -6.912109375, -6.5458984375, -6.1796875, -5.8134765625, -5.447265625, -5.0810546875, -4.71484375, -4.3486328125, -3.982421875, -3.6162109375, -3.25, -2.8837890625, -2.517578125, -2.1513671875, -1.78515625, -1.4189453125, -1.052734375, -0.6865234375, -0.3203125, 0.0458984375, 0.412109375, 0.7783203125, 1.14453125, 1.5107421875, 1.876953125, 2.2431640625, 2.609375, 2.9755859375, 3.341796875, 3.7080078125, 4.07421875, 4.4404296875, 4.806640625, 5.1728515625, 5.5390625, 5.9052734375, 6.271484375, 6.6376953125, 7.00390625, 7.3701171875, 7.736328125, 8.1025390625, 8.46875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 5.0, 7.0, 15.0, 21.0, 17.0, 23.0, 31.0, 53.0, 78.0, 79.0, 124.0, 176.0, 270.0, 473.0, 1657.0, 91529.0, 4049841.0, 47233.0, 1305.0, 463.0, 263.0, 178.0, 111.0, 85.0, 63.0, 37.0, 31.0, 28.0, 14.0, 16.0, 17.0, 13.0, 6.0, 6.0, 8.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-51.28125, -49.650390625, -48.01953125, -46.388671875, -44.7578125, -43.126953125, -41.49609375, -39.865234375, -38.234375, -36.603515625, -34.97265625, -33.341796875, -31.7109375, -30.080078125, -28.44921875, -26.818359375, -25.1875, -23.556640625, -21.92578125, -20.294921875, -18.6640625, -17.033203125, -15.40234375, -13.771484375, -12.140625, -10.509765625, -8.87890625, -7.248046875, -5.6171875, -3.986328125, -2.35546875, -0.724609375, 0.90625, 2.537109375, 4.16796875, 5.798828125, 7.4296875, 9.060546875, 10.69140625, 12.322265625, 13.953125, 15.583984375, 17.21484375, 18.845703125, 20.4765625, 22.107421875, 23.73828125, 25.369140625, 27.0, 28.630859375, 30.26171875, 31.892578125, 33.5234375, 35.154296875, 36.78515625, 38.416015625, 40.046875, 41.677734375, 43.30859375, 44.939453125, 46.5703125, 48.201171875, 49.83203125, 51.462890625, 53.09375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 10.0, 38.0, 64.0, 137.0, 211.0, 227.0, 164.0, 91.0, 40.0, 15.0, 9.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.77938079833984, -100.75592041015625, -97.73246002197266, -94.70899963378906, -91.68553161621094, -88.66207122802734, -85.63861083984375, -82.61515045166016, -79.59169006347656, -76.56822967529297, -73.54476928710938, -70.52130126953125, -67.49784088134766, -64.47438049316406, -61.45092010498047, -58.427459716796875, -55.403995513916016, -52.38053512573242, -49.35707092285156, -46.33361053466797, -43.310150146484375, -40.28668975830078, -37.26322555541992, -34.23976516723633, -31.2163028717041, -28.192840576171875, -25.16938018798828, -22.145917892456055, -19.122455596923828, -16.098995208740234, -13.075532913208008, -10.052072525024414, -7.0286102294921875, -4.005148887634277, -0.981687068939209, 2.0417747497558594, 5.0652360916137695, 8.08869743347168, 11.112159729003906, 14.1356201171875, 17.159082412719727, 20.182544708251953, 23.206005096435547, 26.229467391967773, 29.2529296875, 32.276390075683594, 35.29985046386719, 38.32331085205078, 41.34677505493164, 44.370235443115234, 47.393699645996094, 50.41716003417969, 53.44062042236328, 56.464080810546875, 59.487545013427734, 62.51100540161133, 65.53446960449219, 68.55792999267578, 71.58139038085938, 74.6048583984375, 77.6283187866211, 80.65177917480469, 83.67523956298828, 86.69869995117188, 89.72216033935547]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 5.0, 3.0, 6.0, 8.0, 8.0, 6.0, 19.0, 12.0, 14.0, 14.0, 20.0, 15.0, 16.0, 24.0, 16.0, 37.0, 31.0, 40.0, 33.0, 38.0, 38.0, 32.0, 24.0, 33.0, 47.0, 39.0, 34.0, 35.0, 30.0, 29.0, 28.0, 31.0, 25.0, 28.0, 20.0, 25.0, 19.0, 18.0, 15.0, 16.0, 12.0, 12.0, 9.0, 3.0, 7.0, 5.0, 6.0, 1.0, 5.0, 5.0, 1.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0], "bins": [-34.1158447265625, -33.0200309753418, -31.924217224121094, -30.828401565551758, -29.732587814331055, -28.63677406311035, -27.540958404541016, -26.445144653320312, -25.34933090209961, -24.253517150878906, -23.157703399658203, -22.061887741088867, -20.966073989868164, -19.87026023864746, -18.774444580078125, -17.678630828857422, -16.58281707763672, -15.487003326416016, -14.391188621520996, -13.295373916625977, -12.199560165405273, -11.10374641418457, -10.00793170928955, -8.912117004394531, -7.816303253173828, -6.720489025115967, -5.6246747970581055, -4.528860569000244, -3.433046340942383, -2.3372321128845215, -1.2414178848266602, -0.14560365676879883, 0.9502105712890625, 2.046024799346924, 3.141839027404785, 4.2376532554626465, 5.333467483520508, 6.429281711578369, 7.5250959396362305, 8.62091064453125, 9.716724395751953, 10.812538146972656, 11.908352851867676, 13.004167556762695, 14.099981307983398, 15.195795059204102, 16.291610717773438, 17.38742446899414, 18.483238220214844, 19.579051971435547, 20.67486572265625, 21.770681381225586, 22.86649513244629, 23.962308883666992, 25.058124542236328, 26.15393829345703, 27.249752044677734, 28.345565795898438, 29.44137954711914, 30.537195205688477, 31.63300895690918, 32.728824615478516, 33.82463836669922, 34.92045211791992, 36.016265869140625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 13.0, 11.0, 14.0, 13.0, 14.0, 18.0, 23.0, 24.0, 25.0, 31.0, 22.0, 36.0, 30.0, 35.0, 44.0, 43.0, 44.0, 45.0, 42.0, 41.0, 38.0, 35.0, 30.0, 44.0, 42.0, 32.0, 23.0, 21.0, 20.0, 15.0, 24.0, 16.0, 22.0, 10.0, 12.0, 13.0, 5.0, 9.0, 7.0, 6.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3984375, -5.22540283203125, -5.0523681640625, -4.87933349609375, -4.706298828125, -4.53326416015625, -4.3602294921875, -4.18719482421875, -4.01416015625, -3.84112548828125, -3.6680908203125, -3.49505615234375, -3.322021484375, -3.14898681640625, -2.9759521484375, -2.80291748046875, -2.6298828125, -2.45684814453125, -2.2838134765625, -2.11077880859375, -1.937744140625, -1.76470947265625, -1.5916748046875, -1.41864013671875, -1.24560546875, -1.07257080078125, -0.8995361328125, -0.72650146484375, -0.553466796875, -0.38043212890625, -0.2073974609375, -0.03436279296875, 0.138671875, 0.31170654296875, 0.4847412109375, 0.65777587890625, 0.830810546875, 1.00384521484375, 1.1768798828125, 1.34991455078125, 1.52294921875, 1.69598388671875, 1.8690185546875, 2.04205322265625, 2.215087890625, 2.38812255859375, 2.5611572265625, 2.73419189453125, 2.9072265625, 3.08026123046875, 3.2532958984375, 3.42633056640625, 3.599365234375, 3.77239990234375, 3.9454345703125, 4.11846923828125, 4.29150390625, 4.46453857421875, 4.6375732421875, 4.81060791015625, 4.983642578125, 5.15667724609375, 5.3297119140625, 5.50274658203125, 5.67578125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 6.0, 4.0, 7.0, 11.0, 18.0, 17.0, 19.0, 51.0, 63.0, 89.0, 153.0, 228.0, 302.0, 481.0, 688.0, 1042.0, 1521.0, 2197.0, 3234.0, 4636.0, 6990.0, 10330.0, 15362.0, 23349.0, 36120.0, 58556.0, 100943.0, 228678.0, 264392.0, 111487.0, 63220.0, 39139.0, 24890.0, 16307.0, 10884.0, 7400.0, 5048.0, 3472.0, 2342.0, 1584.0, 1039.0, 715.0, 491.0, 342.0, 238.0, 138.0, 112.0, 86.0, 45.0, 34.0, 27.0, 12.0, 9.0, 8.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.0361328125, -1.0027923583984375, -0.969451904296875, -0.9361114501953125, -0.90277099609375, -0.8694305419921875, -0.836090087890625, -0.8027496337890625, -0.7694091796875, -0.7360687255859375, -0.702728271484375, -0.6693878173828125, -0.63604736328125, -0.6027069091796875, -0.569366455078125, -0.5360260009765625, -0.502685546875, -0.4693450927734375, -0.436004638671875, -0.4026641845703125, -0.36932373046875, -0.3359832763671875, -0.302642822265625, -0.2693023681640625, -0.2359619140625, -0.2026214599609375, -0.169281005859375, -0.1359405517578125, -0.10260009765625, -0.0692596435546875, -0.035919189453125, -0.0025787353515625, 0.03076171875, 0.0641021728515625, 0.097442626953125, 0.1307830810546875, 0.16412353515625, 0.1974639892578125, 0.230804443359375, 0.2641448974609375, 0.2974853515625, 0.3308258056640625, 0.364166259765625, 0.3975067138671875, 0.43084716796875, 0.4641876220703125, 0.497528076171875, 0.5308685302734375, 0.564208984375, 0.5975494384765625, 0.630889892578125, 0.6642303466796875, 0.69757080078125, 0.7309112548828125, 0.764251708984375, 0.7975921630859375, 0.8309326171875, 0.8642730712890625, 0.897613525390625, 0.9309539794921875, 0.96429443359375, 0.9976348876953125, 1.030975341796875, 1.0643157958984375, 1.09765625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 6.0, 12.0, 9.0, 6.0, 7.0, 10.0, 15.0, 14.0, 21.0, 27.0, 24.0, 22.0, 26.0, 25.0, 29.0, 23.0, 33.0, 30.0, 41.0, 55.0, 1061.0, 35.0, 39.0, 39.0, 50.0, 40.0, 36.0, 44.0, 43.0, 26.0, 17.0, 33.0, 21.0, 23.0, 10.0, 17.0, 13.0, 8.0, 8.0, 5.0, 8.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.34765625, -3.238677978515625, -3.12969970703125, -3.020721435546875, -2.9117431640625, -2.802764892578125, -2.69378662109375, -2.584808349609375, -2.475830078125, -2.366851806640625, -2.25787353515625, -2.148895263671875, -2.0399169921875, -1.930938720703125, -1.82196044921875, -1.712982177734375, -1.60400390625, -1.495025634765625, -1.38604736328125, -1.277069091796875, -1.1680908203125, -1.059112548828125, -0.95013427734375, -0.841156005859375, -0.732177734375, -0.623199462890625, -0.51422119140625, -0.405242919921875, -0.2962646484375, -0.187286376953125, -0.07830810546875, 0.030670166015625, 0.1396484375, 0.248626708984375, 0.35760498046875, 0.466583251953125, 0.5755615234375, 0.684539794921875, 0.79351806640625, 0.902496337890625, 1.011474609375, 1.120452880859375, 1.22943115234375, 1.338409423828125, 1.4473876953125, 1.556365966796875, 1.66534423828125, 1.774322509765625, 1.88330078125, 1.992279052734375, 2.10125732421875, 2.210235595703125, 2.3192138671875, 2.428192138671875, 2.53717041015625, 2.646148681640625, 2.755126953125, 2.864105224609375, 2.97308349609375, 3.082061767578125, 3.1910400390625, 3.300018310546875, 3.40899658203125, 3.517974853515625, 3.626953125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 7.0, 9.0, 3.0, 12.0, 14.0, 25.0, 33.0, 52.0, 93.0, 167.0, 260.0, 524.0, 942.0, 1660.0, 3145.0, 5908.0, 11387.0, 22284.0, 45199.0, 97264.0, 298360.0, 1401871.0, 108275.0, 49118.0, 24375.0, 12366.0, 6291.0, 3457.0, 1755.0, 996.0, 564.0, 289.0, 156.0, 93.0, 61.0, 38.0, 18.0, 11.0, 8.0, 6.0, 18.0, 4.0, 7.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7392578125, -1.6866455078125, -1.634033203125, -1.5814208984375, -1.52880859375, -1.4761962890625, -1.423583984375, -1.3709716796875, -1.318359375, -1.2657470703125, -1.213134765625, -1.1605224609375, -1.10791015625, -1.0552978515625, -1.002685546875, -0.9500732421875, -0.8974609375, -0.8448486328125, -0.792236328125, -0.7396240234375, -0.68701171875, -0.6343994140625, -0.581787109375, -0.5291748046875, -0.4765625, -0.4239501953125, -0.371337890625, -0.3187255859375, -0.26611328125, -0.2135009765625, -0.160888671875, -0.1082763671875, -0.0556640625, -0.0030517578125, 0.049560546875, 0.1021728515625, 0.15478515625, 0.2073974609375, 0.260009765625, 0.3126220703125, 0.365234375, 0.4178466796875, 0.470458984375, 0.5230712890625, 0.57568359375, 0.6282958984375, 0.680908203125, 0.7335205078125, 0.7861328125, 0.8387451171875, 0.891357421875, 0.9439697265625, 0.99658203125, 1.0491943359375, 1.101806640625, 1.1544189453125, 1.20703125, 1.2596435546875, 1.312255859375, 1.3648681640625, 1.41748046875, 1.4700927734375, 1.522705078125, 1.5753173828125, 1.6279296875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 5.0, 7.0, 7.0, 7.0, 14.0, 11.0, 27.0, 29.0, 30.0, 49.0, 79.0, 82.0, 92.0, 103.0, 94.0, 80.0, 76.0, 55.0, 42.0, 32.0, 13.0, 14.0, 15.0, 9.0, 8.0, 4.0, 4.0, 8.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007786750793457031, -0.0007521137595176697, -0.0007255524396896362, -0.0006989911198616028, -0.0006724298000335693, -0.0006458684802055359, -0.0006193071603775024, -0.000592745840549469, -0.0005661845207214355, -0.0005396232008934021, -0.0005130618810653687, -0.0004865005612373352, -0.00045993924140930176, -0.0004333779215812683, -0.00040681660175323486, -0.0003802552819252014, -0.00035369396209716797, -0.0003271326422691345, -0.0003005713224411011, -0.0002740100026130676, -0.0002474486827850342, -0.00022088736295700073, -0.00019432604312896729, -0.00016776472330093384, -0.0001412034034729004, -0.00011464208364486694, -8.80807638168335e-05, -6.151944398880005e-05, -3.49581241607666e-05, -8.396804332733154e-06, 1.8164515495300293e-05, 4.472583532333374e-05, 7.128715515136719e-05, 9.784847497940063e-05, 0.00012440979480743408, 0.00015097111463546753, 0.00017753243446350098, 0.00020409375429153442, 0.00023065507411956787, 0.0002572163939476013, 0.00028377771377563477, 0.0003103390336036682, 0.00033690035343170166, 0.0003634616732597351, 0.00039002299308776855, 0.000416584312915802, 0.00044314563274383545, 0.0004697069525718689, 0.0004962682723999023, 0.0005228295922279358, 0.0005493909120559692, 0.0005759522318840027, 0.0006025135517120361, 0.0006290748715400696, 0.000655636191368103, 0.0006821975111961365, 0.0007087588310241699, 0.0007353201508522034, 0.0007618814706802368, 0.0007884427905082703, 0.0008150041103363037, 0.0008415654301643372, 0.0008681267499923706, 0.000894688069820404, 0.0009212493896484375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 4.0, 11.0, 9.0, 8.0, 17.0, 26.0, 33.0, 54.0, 87.0, 143.0, 287.0, 927.0, 655327.0, 390130.0, 872.0, 268.0, 122.0, 63.0, 47.0, 31.0, 18.0, 16.0, 13.0, 7.0, 5.0, 11.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0228118896484375, -0.022159576416015625, -0.02150726318359375, -0.020854949951171875, -0.02020263671875, -0.019550323486328125, -0.01889801025390625, -0.018245697021484375, -0.0175933837890625, -0.016941070556640625, -0.01628875732421875, -0.015636444091796875, -0.014984130859375, -0.014331817626953125, -0.01367950439453125, -0.013027191162109375, -0.0123748779296875, -0.011722564697265625, -0.01107025146484375, -0.010417938232421875, -0.009765625, -0.009113311767578125, -0.00846099853515625, -0.007808685302734375, -0.0071563720703125, -0.006504058837890625, -0.00585174560546875, -0.005199432373046875, -0.004547119140625, -0.003894805908203125, -0.00324249267578125, -0.002590179443359375, -0.0019378662109375, -0.001285552978515625, -0.00063323974609375, 1.9073486328125e-05, 0.00067138671875, 0.001323699951171875, 0.00197601318359375, 0.002628326416015625, 0.0032806396484375, 0.003932952880859375, 0.00458526611328125, 0.005237579345703125, 0.005889892578125, 0.006542205810546875, 0.00719451904296875, 0.007846832275390625, 0.0084991455078125, 0.009151458740234375, 0.00980377197265625, 0.010456085205078125, 0.0111083984375, 0.011760711669921875, 0.01241302490234375, 0.013065338134765625, 0.0137176513671875, 0.014369964599609375, 0.01502227783203125, 0.015674591064453125, 0.016326904296875, 0.016979217529296875, 0.01763153076171875, 0.018283843994140625, 0.0189361572265625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 41.0, 304.0, 487.0, 158.0, 22.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.003743014996871352, -0.0036753020249307156, -0.0036075888201594353, -0.0035398758482187986, -0.003472162876278162, -0.0034044496715068817, -0.003336736699566245, -0.0032690237276256084, -0.003201310522854328, -0.0031335975509136915, -0.0030658843461424112, -0.0029981713742017746, -0.002930458402261138, -0.0028627454303205013, -0.002795032225549221, -0.0027273192536085844, -0.0026596062816679478, -0.002591893309727311, -0.002524180104956031, -0.002456467133015394, -0.0023887541610747576, -0.002321041189134121, -0.0022533279843628407, -0.002185615012422204, -0.0021179020404815674, -0.0020501890685409307, -0.0019824758637696505, -0.0019147628918290138, -0.0018470499198883772, -0.0017793368315324187, -0.0017116237431764603, -0.0016439107712358236, -0.0015761974500492215, -0.001508484361693263, -0.0014407713897526264, -0.001373058301396668, -0.0013053452130407095, -0.0012376322411000729, -0.0011699191527441144, -0.001102206064388156, -0.0010344930924475193, -0.0009667800622992218, -0.0008990670321509242, -0.0008313539437949657, -0.0007636409136466682, -0.0006959278834983706, -0.0006282147951424122, -0.0005605017649941146, -0.0004927887348458171, -0.00042507570469751954, -0.00035736264544539154, -0.00028964958619326353, -0.00022193655604496598, -0.00015422352589666843, -8.651046664454043e-05, -1.8797407392412424e-05, 4.8915622755885124e-05, 0.0001166286674560979, 0.00018434171215631068, 0.0002520547714084387, 0.00031976780155673623, 0.0003874808317050338, 0.0004551938909571618, 0.0005229069502092898, 0.0005906199803575873]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 4.0, 2.0, 2.0, 4.0, 5.0, 5.0, 13.0, 6.0, 17.0, 16.0, 21.0, 22.0, 17.0, 22.0, 33.0, 24.0, 27.0, 34.0, 37.0, 39.0, 34.0, 33.0, 38.0, 38.0, 37.0, 39.0, 38.0, 41.0, 38.0, 34.0, 23.0, 27.0, 28.0, 28.0, 30.0, 22.0, 14.0, 15.0, 20.0, 17.0, 12.0, 19.0, 4.0, 12.0, 5.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0002879500389099121, -0.00027918070554733276, -0.0002704113721847534, -0.00026164203882217407, -0.0002528727054595947, -0.00024410337209701538, -0.00023533403873443604, -0.0002265647053718567, -0.00021779537200927734, -0.000209026038646698, -0.00020025670528411865, -0.0001914873719215393, -0.00018271803855895996, -0.00017394870519638062, -0.00016517937183380127, -0.00015641003847122192, -0.00014764070510864258, -0.00013887137174606323, -0.0001301020383834839, -0.00012133270502090454, -0.0001125633716583252, -0.00010379403829574585, -9.50247049331665e-05, -8.625537157058716e-05, -7.748603820800781e-05, -6.871670484542847e-05, -5.994737148284912e-05, -5.1178038120269775e-05, -4.240870475769043e-05, -3.3639371395111084e-05, -2.4870038032531738e-05, -1.6100704669952393e-05, -7.331371307373047e-06, 1.4379620552062988e-06, 1.0207295417785645e-05, 1.897662878036499e-05, 2.7745962142944336e-05, 3.651529550552368e-05, 4.528462886810303e-05, 5.405396223068237e-05, 6.282329559326172e-05, 7.159262895584106e-05, 8.036196231842041e-05, 8.913129568099976e-05, 9.79006290435791e-05, 0.00010666996240615845, 0.00011543929576873779, 0.00012420862913131714, 0.00013297796249389648, 0.00014174729585647583, 0.00015051662921905518, 0.00015928596258163452, 0.00016805529594421387, 0.0001768246293067932, 0.00018559396266937256, 0.0001943632960319519, 0.00020313262939453125, 0.0002119019627571106, 0.00022067129611968994, 0.0002294406294822693, 0.00023820996284484863, 0.000246979296207428, 0.0002557486295700073, 0.00026451796293258667, 0.000273287296295166]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 13.0, 11.0, 14.0, 13.0, 14.0, 18.0, 23.0, 24.0, 25.0, 31.0, 22.0, 36.0, 30.0, 35.0, 44.0, 43.0, 44.0, 45.0, 42.0, 41.0, 38.0, 35.0, 30.0, 44.0, 42.0, 32.0, 23.0, 21.0, 20.0, 15.0, 24.0, 16.0, 22.0, 10.0, 12.0, 13.0, 5.0, 9.0, 7.0, 6.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3984375, -5.22540283203125, -5.0523681640625, -4.87933349609375, -4.706298828125, -4.53326416015625, -4.3602294921875, -4.18719482421875, -4.01416015625, -3.84112548828125, -3.6680908203125, -3.49505615234375, -3.322021484375, -3.14898681640625, -2.9759521484375, -2.80291748046875, -2.6298828125, -2.45684814453125, -2.2838134765625, -2.11077880859375, -1.937744140625, -1.76470947265625, -1.5916748046875, -1.41864013671875, -1.24560546875, -1.07257080078125, -0.8995361328125, -0.72650146484375, -0.553466796875, -0.38043212890625, -0.2073974609375, -0.03436279296875, 0.138671875, 0.31170654296875, 0.4847412109375, 0.65777587890625, 0.830810546875, 1.00384521484375, 1.1768798828125, 1.34991455078125, 1.52294921875, 1.69598388671875, 1.8690185546875, 2.04205322265625, 2.215087890625, 2.38812255859375, 2.5611572265625, 2.73419189453125, 2.9072265625, 3.08026123046875, 3.2532958984375, 3.42633056640625, 3.599365234375, 3.77239990234375, 3.9454345703125, 4.11846923828125, 4.29150390625, 4.46453857421875, 4.6375732421875, 4.81060791015625, 4.983642578125, 5.15667724609375, 5.3297119140625, 5.50274658203125, 5.67578125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 5.0, 4.0, 3.0, 8.0, 6.0, 10.0, 14.0, 23.0, 28.0, 33.0, 54.0, 81.0, 106.0, 167.0, 250.0, 350.0, 576.0, 899.0, 1565.0, 2750.0, 5225.0, 9628.0, 18820.0, 37162.0, 75622.0, 162938.0, 308196.0, 222867.0, 100393.0, 48538.0, 24257.0, 12651.0, 6676.0, 3507.0, 1942.0, 1124.0, 742.0, 434.0, 255.0, 195.0, 120.0, 85.0, 73.0, 42.0, 36.0, 38.0, 19.0, 18.0, 10.0, 5.0, 3.0, 5.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-3.3984375, -3.29449462890625, -3.1905517578125, -3.08660888671875, -2.982666015625, -2.87872314453125, -2.7747802734375, -2.67083740234375, -2.56689453125, -2.46295166015625, -2.3590087890625, -2.25506591796875, -2.151123046875, -2.04718017578125, -1.9432373046875, -1.83929443359375, -1.7353515625, -1.63140869140625, -1.5274658203125, -1.42352294921875, -1.319580078125, -1.21563720703125, -1.1116943359375, -1.00775146484375, -0.90380859375, -0.79986572265625, -0.6959228515625, -0.59197998046875, -0.488037109375, -0.38409423828125, -0.2801513671875, -0.17620849609375, -0.072265625, 0.03167724609375, 0.1356201171875, 0.23956298828125, 0.343505859375, 0.44744873046875, 0.5513916015625, 0.65533447265625, 0.75927734375, 0.86322021484375, 0.9671630859375, 1.07110595703125, 1.175048828125, 1.27899169921875, 1.3829345703125, 1.48687744140625, 1.5908203125, 1.69476318359375, 1.7987060546875, 1.90264892578125, 2.006591796875, 2.11053466796875, 2.2144775390625, 2.31842041015625, 2.42236328125, 2.52630615234375, 2.6302490234375, 2.73419189453125, 2.838134765625, 2.94207763671875, 3.0460205078125, 3.14996337890625, 3.25390625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 4.0, 5.0, 5.0, 10.0, 17.0, 11.0, 18.0, 21.0, 18.0, 25.0, 31.0, 31.0, 35.0, 42.0, 55.0, 61.0, 82.0, 172.0, 1560.0, 298.0, 138.0, 63.0, 47.0, 49.0, 45.0, 35.0, 34.0, 35.0, 14.0, 12.0, 11.0, 11.0, 9.0, 8.0, 6.0, 8.0, 6.0, 4.0, 6.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.9375, -24.219970703125, -23.50244140625, -22.784912109375, -22.0673828125, -21.349853515625, -20.63232421875, -19.914794921875, -19.197265625, -18.479736328125, -17.76220703125, -17.044677734375, -16.3271484375, -15.609619140625, -14.89208984375, -14.174560546875, -13.45703125, -12.739501953125, -12.02197265625, -11.304443359375, -10.5869140625, -9.869384765625, -9.15185546875, -8.434326171875, -7.716796875, -6.999267578125, -6.28173828125, -5.564208984375, -4.8466796875, -4.129150390625, -3.41162109375, -2.694091796875, -1.9765625, -1.259033203125, -0.54150390625, 0.176025390625, 0.8935546875, 1.611083984375, 2.32861328125, 3.046142578125, 3.763671875, 4.481201171875, 5.19873046875, 5.916259765625, 6.6337890625, 7.351318359375, 8.06884765625, 8.786376953125, 9.50390625, 10.221435546875, 10.93896484375, 11.656494140625, 12.3740234375, 13.091552734375, 13.80908203125, 14.526611328125, 15.244140625, 15.961669921875, 16.67919921875, 17.396728515625, 18.1142578125, 18.831787109375, 19.54931640625, 20.266845703125, 20.984375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 8.0, 6.0, 4.0, 10.0, 11.0, 6.0, 16.0, 13.0, 19.0, 24.0, 32.0, 50.0, 82.0, 103.0, 123.0, 165.0, 223.0, 382.0, 864.0, 7727.0, 3083361.0, 49639.0, 1279.0, 466.0, 280.0, 184.0, 168.0, 106.0, 82.0, 73.0, 47.0, 34.0, 33.0, 22.0, 16.0, 11.0, 8.0, 8.0, 9.0, 1.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.75, -44.154296875, -42.55859375, -40.962890625, -39.3671875, -37.771484375, -36.17578125, -34.580078125, -32.984375, -31.388671875, -29.79296875, -28.197265625, -26.6015625, -25.005859375, -23.41015625, -21.814453125, -20.21875, -18.623046875, -17.02734375, -15.431640625, -13.8359375, -12.240234375, -10.64453125, -9.048828125, -7.453125, -5.857421875, -4.26171875, -2.666015625, -1.0703125, 0.525390625, 2.12109375, 3.716796875, 5.3125, 6.908203125, 8.50390625, 10.099609375, 11.6953125, 13.291015625, 14.88671875, 16.482421875, 18.078125, 19.673828125, 21.26953125, 22.865234375, 24.4609375, 26.056640625, 27.65234375, 29.248046875, 30.84375, 32.439453125, 34.03515625, 35.630859375, 37.2265625, 38.822265625, 40.41796875, 42.013671875, 43.609375, 45.205078125, 46.80078125, 48.396484375, 49.9921875, 51.587890625, 53.18359375, 54.779296875, 56.375]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 22.0, 512.0, 451.0, 27.0, 3.0, 0.0, 1.0], "bins": [-250.46109008789062, -246.2123565673828, -241.96360778808594, -237.71487426757812, -233.4661407470703, -229.2174072265625, -224.96865844726562, -220.7199249267578, -216.47119140625, -212.2224578857422, -207.9737091064453, -203.7249755859375, -199.4762420654297, -195.22750854492188, -190.978759765625, -186.7300262451172, -182.48129272460938, -178.23255920410156, -173.9838104248047, -169.73507690429688, -165.48634338378906, -161.23760986328125, -156.98886108398438, -152.74012756347656, -148.4913787841797, -144.24264526367188, -139.993896484375, -135.7451629638672, -131.49642944335938, -127.24768829345703, -122.99894714355469, -118.75021362304688, -114.50146484375, -110.25272369384766, -106.00399017333984, -101.7552490234375, -97.50651550292969, -93.25777435302734, -89.009033203125, -84.76029968261719, -80.51156616210938, -76.26282501220703, -72.01409149169922, -67.76535034179688, -63.51661682128906, -59.26787567138672, -55.01913833618164, -50.77040100097656, -46.52165985107422, -42.27292251586914, -38.02418518066406, -33.77544403076172, -29.526708602905273, -25.277971267700195, -21.029232025146484, -16.780494689941406, -12.531759262084961, -8.283021926879883, -4.034283638000488, 0.21445465087890625, 4.463191986083984, 8.711929321289062, 12.960668563842773, 17.20940589904785, 21.45814323425293]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 8.0, 6.0, 14.0, 10.0, 16.0, 7.0, 16.0, 23.0, 25.0, 29.0, 28.0, 31.0, 35.0, 39.0, 43.0, 40.0, 43.0, 36.0, 48.0, 34.0, 56.0, 44.0, 40.0, 30.0, 34.0, 36.0, 28.0, 37.0, 30.0, 23.0, 16.0, 19.0, 12.0, 10.0, 11.0, 9.0, 5.0, 8.0, 10.0, 6.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-45.542022705078125, -43.97051239013672, -42.39900588989258, -40.82749557495117, -39.25598907470703, -37.684478759765625, -36.11296844482422, -34.54146194458008, -32.96995544433594, -31.398447036743164, -29.82693862915039, -28.255428314208984, -26.683921813964844, -25.112411499023438, -23.540903091430664, -21.96939468383789, -20.397884368896484, -18.82637596130371, -17.254867553710938, -15.683358192443848, -14.111849784851074, -12.5403413772583, -10.968832015991211, -9.397323608398438, -7.825815200805664, -6.254306793212891, -4.682797908782959, -3.1112890243530273, -1.539780616760254, 0.03172779083251953, 1.6032371520996094, 3.174745559692383, 4.746250152587891, 6.317758560180664, 7.889267444610596, 9.460776329040527, 11.0322847366333, 12.603793144226074, 14.175302505493164, 15.746810913085938, 17.31831932067871, 18.889827728271484, 20.461336135864258, 22.03284454345703, 23.604354858398438, 25.175861358642578, 26.747371673583984, 28.318880081176758, 29.89038848876953, 31.461896896362305, 33.03340530395508, 34.604915618896484, 36.176422119140625, 37.74793243408203, 39.31944274902344, 40.89094924926758, 42.46245574951172, 44.033966064453125, 45.605472564697266, 47.17698287963867, 48.74848937988281, 50.31999969482422, 51.891510009765625, 53.463016510009766, 55.03452682495117]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 10.0, 12.0, 6.0, 21.0, 12.0, 16.0, 18.0, 30.0, 20.0, 23.0, 26.0, 27.0, 36.0, 30.0, 54.0, 36.0, 36.0, 30.0, 56.0, 47.0, 42.0, 42.0, 39.0, 26.0, 40.0, 34.0, 25.0, 31.0, 13.0, 22.0, 24.0, 20.0, 19.0, 18.0, 10.0, 11.0, 12.0, 8.0, 5.0, 7.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.44921875, -5.266845703125, -5.08447265625, -4.902099609375, -4.7197265625, -4.537353515625, -4.35498046875, -4.172607421875, -3.990234375, -3.807861328125, -3.62548828125, -3.443115234375, -3.2607421875, -3.078369140625, -2.89599609375, -2.713623046875, -2.53125, -2.348876953125, -2.16650390625, -1.984130859375, -1.8017578125, -1.619384765625, -1.43701171875, -1.254638671875, -1.072265625, -0.889892578125, -0.70751953125, -0.525146484375, -0.3427734375, -0.160400390625, 0.02197265625, 0.204345703125, 0.38671875, 0.569091796875, 0.75146484375, 0.933837890625, 1.1162109375, 1.298583984375, 1.48095703125, 1.663330078125, 1.845703125, 2.028076171875, 2.21044921875, 2.392822265625, 2.5751953125, 2.757568359375, 2.93994140625, 3.122314453125, 3.3046875, 3.487060546875, 3.66943359375, 3.851806640625, 4.0341796875, 4.216552734375, 4.39892578125, 4.581298828125, 4.763671875, 4.946044921875, 5.12841796875, 5.310791015625, 5.4931640625, 5.675537109375, 5.85791015625, 6.040283203125, 6.22265625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 9.0, 14.0, 17.0, 18.0, 16.0, 19.0, 25.0, 25.0, 30.0, 41.0, 49.0, 99.0, 163.0, 290.0, 1466.0, 20152.0, 2035350.0, 2112666.0, 21376.0, 1575.0, 343.0, 173.0, 76.0, 53.0, 34.0, 37.0, 16.0, 31.0, 24.0, 20.0, 7.0, 14.0, 16.0, 14.0, 8.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.328125, -23.517333984375, -22.70654296875, -21.895751953125, -21.0849609375, -20.274169921875, -19.46337890625, -18.652587890625, -17.841796875, -17.031005859375, -16.22021484375, -15.409423828125, -14.5986328125, -13.787841796875, -12.97705078125, -12.166259765625, -11.35546875, -10.544677734375, -9.73388671875, -8.923095703125, -8.1123046875, -7.301513671875, -6.49072265625, -5.679931640625, -4.869140625, -4.058349609375, -3.24755859375, -2.436767578125, -1.6259765625, -0.815185546875, -0.00439453125, 0.806396484375, 1.6171875, 2.427978515625, 3.23876953125, 4.049560546875, 4.8603515625, 5.671142578125, 6.48193359375, 7.292724609375, 8.103515625, 8.914306640625, 9.72509765625, 10.535888671875, 11.3466796875, 12.157470703125, 12.96826171875, 13.779052734375, 14.58984375, 15.400634765625, 16.21142578125, 17.022216796875, 17.8330078125, 18.643798828125, 19.45458984375, 20.265380859375, 21.076171875, 21.886962890625, 22.69775390625, 23.508544921875, 24.3193359375, 25.130126953125, 25.94091796875, 26.751708984375, 27.5625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 7.0, 5.0, 7.0, 6.0, 5.0, 16.0, 6.0, 22.0, 20.0, 31.0, 38.0, 53.0, 67.0, 91.0, 119.0, 152.0, 184.0, 256.0, 316.0, 351.0, 406.0, 368.0, 344.0, 292.0, 219.0, 173.0, 106.0, 93.0, 57.0, 58.0, 56.0, 33.0, 31.0, 23.0, 18.0, 10.0, 6.0, 10.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0], "bins": [-11.90625, -11.5731201171875, -11.239990234375, -10.9068603515625, -10.57373046875, -10.2406005859375, -9.907470703125, -9.5743408203125, -9.2412109375, -8.9080810546875, -8.574951171875, -8.2418212890625, -7.90869140625, -7.5755615234375, -7.242431640625, -6.9093017578125, -6.576171875, -6.2430419921875, -5.909912109375, -5.5767822265625, -5.24365234375, -4.9105224609375, -4.577392578125, -4.2442626953125, -3.9111328125, -3.5780029296875, -3.244873046875, -2.9117431640625, -2.57861328125, -2.2454833984375, -1.912353515625, -1.5792236328125, -1.24609375, -0.9129638671875, -0.579833984375, -0.2467041015625, 0.08642578125, 0.4195556640625, 0.752685546875, 1.0858154296875, 1.4189453125, 1.7520751953125, 2.085205078125, 2.4183349609375, 2.75146484375, 3.0845947265625, 3.417724609375, 3.7508544921875, 4.083984375, 4.4171142578125, 4.750244140625, 5.0833740234375, 5.41650390625, 5.7496337890625, 6.082763671875, 6.4158935546875, 6.7490234375, 7.0821533203125, 7.415283203125, 7.7484130859375, 8.08154296875, 8.4146728515625, 8.747802734375, 9.0809326171875, 9.4140625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 6.0, 4.0, 7.0, 10.0, 19.0, 7.0, 12.0, 13.0, 38.0, 38.0, 40.0, 67.0, 76.0, 99.0, 122.0, 160.0, 271.0, 519.0, 1620.0, 27074.0, 3866356.0, 291877.0, 3796.0, 790.0, 372.0, 244.0, 161.0, 92.0, 85.0, 63.0, 43.0, 43.0, 38.0, 28.0, 23.0, 11.0, 12.0, 10.0, 5.0, 5.0, 1.0, 11.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-53.03125, -51.54638671875, -50.0615234375, -48.57666015625, -47.091796875, -45.60693359375, -44.1220703125, -42.63720703125, -41.15234375, -39.66748046875, -38.1826171875, -36.69775390625, -35.212890625, -33.72802734375, -32.2431640625, -30.75830078125, -29.2734375, -27.78857421875, -26.3037109375, -24.81884765625, -23.333984375, -21.84912109375, -20.3642578125, -18.87939453125, -17.39453125, -15.90966796875, -14.4248046875, -12.93994140625, -11.455078125, -9.97021484375, -8.4853515625, -7.00048828125, -5.515625, -4.03076171875, -2.5458984375, -1.06103515625, 0.423828125, 1.90869140625, 3.3935546875, 4.87841796875, 6.36328125, 7.84814453125, 9.3330078125, 10.81787109375, 12.302734375, 13.78759765625, 15.2724609375, 16.75732421875, 18.2421875, 19.72705078125, 21.2119140625, 22.69677734375, 24.181640625, 25.66650390625, 27.1513671875, 28.63623046875, 30.12109375, 31.60595703125, 33.0908203125, 34.57568359375, 36.060546875, 37.54541015625, 39.0302734375, 40.51513671875, 42.0]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 44.0, 180.0, 344.0, 300.0, 109.0, 25.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.9864730834961, -122.07630920410156, -117.16614532470703, -112.2559814453125, -107.34581756591797, -102.43565368652344, -97.5254898071289, -92.61532592773438, -87.70516204833984, -82.79499816894531, -77.88483428955078, -72.97467041015625, -68.06450653076172, -63.15434265136719, -58.244178771972656, -53.334014892578125, -48.423851013183594, -43.51368713378906, -38.60352325439453, -33.693359375, -28.78319549560547, -23.873031616210938, -18.962867736816406, -14.052703857421875, -9.142539978027344, -4.2323760986328125, 0.6777877807617188, 5.58795166015625, 10.498115539550781, 15.408279418945312, 20.318443298339844, 25.228607177734375, 30.138778686523438, 35.04894256591797, 39.9591064453125, 44.86927032470703, 49.77943420410156, 54.689598083496094, 59.599761962890625, 64.50992584228516, 69.42008972167969, 74.33025360107422, 79.24041748046875, 84.15058135986328, 89.06074523925781, 93.97090911865234, 98.88107299804688, 103.7912368774414, 108.70140075683594, 113.61156463623047, 118.521728515625, 123.43189239501953, 128.34205627441406, 133.25222778320312, 138.16238403320312, 143.07254028320312, 147.9827117919922, 152.89288330078125, 157.80303955078125, 162.71319580078125, 167.6233673095703, 172.53353881835938, 177.44369506835938, 182.35385131835938, 187.26402282714844]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 0.0, 3.0, 6.0, 3.0, 4.0, 5.0, 4.0, 5.0, 10.0, 9.0, 13.0, 18.0, 16.0, 14.0, 15.0, 21.0, 20.0, 29.0, 21.0, 22.0, 41.0, 36.0, 25.0, 36.0, 37.0, 46.0, 35.0, 35.0, 36.0, 36.0, 42.0, 34.0, 27.0, 31.0, 33.0, 34.0, 19.0, 28.0, 27.0, 23.0, 14.0, 20.0, 11.0, 14.0, 11.0, 6.0, 8.0, 9.0, 4.0, 5.0, 3.0, 5.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.415283203125, -34.237327575683594, -33.05937194824219, -31.88141632080078, -30.703460693359375, -29.52550506591797, -28.347549438476562, -27.169593811035156, -25.99163818359375, -24.813682556152344, -23.635726928710938, -22.45777130126953, -21.279815673828125, -20.10186004638672, -18.923904418945312, -17.745948791503906, -16.5679931640625, -15.390037536621094, -14.212081909179688, -13.034126281738281, -11.856170654296875, -10.678215026855469, -9.500259399414062, -8.322303771972656, -7.14434814453125, -5.966392517089844, -4.7884368896484375, -3.6104812622070312, -2.432525634765625, -1.2545700073242188, -0.0766143798828125, 1.1013412475585938, 2.279296875, 3.4572525024414062, 4.6352081298828125, 5.813163757324219, 6.991119384765625, 8.169075012207031, 9.347030639648438, 10.524986267089844, 11.70294189453125, 12.880897521972656, 14.058853149414062, 15.236808776855469, 16.414764404296875, 17.59272003173828, 18.770675659179688, 19.948631286621094, 21.1265869140625, 22.304542541503906, 23.482498168945312, 24.66045379638672, 25.838409423828125, 27.01636505126953, 28.194320678710938, 29.372276306152344, 30.55023193359375, 31.728187561035156, 32.90614318847656, 34.08409881591797, 35.262054443359375, 36.44001007080078, 37.61796569824219, 38.795921325683594, 39.973876953125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 0.0, 6.0, 8.0, 10.0, 9.0, 13.0, 15.0, 25.0, 26.0, 31.0, 30.0, 39.0, 33.0, 41.0, 37.0, 48.0, 61.0, 57.0, 54.0, 42.0, 45.0, 36.0, 47.0, 50.0, 32.0, 34.0, 27.0, 26.0, 16.0, 28.0, 24.0, 22.0, 9.0, 10.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.19140625, -6.96893310546875, -6.7464599609375, -6.52398681640625, -6.301513671875, -6.07904052734375, -5.8565673828125, -5.63409423828125, -5.41162109375, -5.18914794921875, -4.9666748046875, -4.74420166015625, -4.521728515625, -4.29925537109375, -4.0767822265625, -3.85430908203125, -3.6318359375, -3.40936279296875, -3.1868896484375, -2.96441650390625, -2.741943359375, -2.51947021484375, -2.2969970703125, -2.07452392578125, -1.85205078125, -1.62957763671875, -1.4071044921875, -1.18463134765625, -0.962158203125, -0.73968505859375, -0.5172119140625, -0.29473876953125, -0.072265625, 0.15020751953125, 0.3726806640625, 0.59515380859375, 0.817626953125, 1.04010009765625, 1.2625732421875, 1.48504638671875, 1.70751953125, 1.92999267578125, 2.1524658203125, 2.37493896484375, 2.597412109375, 2.81988525390625, 3.0423583984375, 3.26483154296875, 3.4873046875, 3.70977783203125, 3.9322509765625, 4.15472412109375, 4.377197265625, 4.59967041015625, 4.8221435546875, 5.04461669921875, 5.26708984375, 5.48956298828125, 5.7120361328125, 5.93450927734375, 6.156982421875, 6.37945556640625, 6.6019287109375, 6.82440185546875, 7.046875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 9.0, 16.0, 16.0, 18.0, 32.0, 57.0, 75.0, 119.0, 176.0, 381.0, 518.0, 1025.0, 1769.0, 3005.0, 5265.0, 9160.0, 15294.0, 26638.0, 46903.0, 88349.0, 197935.0, 362878.0, 133620.0, 67531.0, 37018.0, 20901.0, 12704.0, 7417.0, 4176.0, 2367.0, 1349.0, 697.0, 463.0, 248.0, 165.0, 85.0, 60.0, 40.0, 21.0, 23.0, 19.0, 8.0, 1.0, 2.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5205078125, -1.473419189453125, -1.42633056640625, -1.379241943359375, -1.3321533203125, -1.285064697265625, -1.23797607421875, -1.190887451171875, -1.143798828125, -1.096710205078125, -1.04962158203125, -1.002532958984375, -0.9554443359375, -0.908355712890625, -0.86126708984375, -0.814178466796875, -0.76708984375, -0.720001220703125, -0.67291259765625, -0.625823974609375, -0.5787353515625, -0.531646728515625, -0.48455810546875, -0.437469482421875, -0.390380859375, -0.343292236328125, -0.29620361328125, -0.249114990234375, -0.2020263671875, -0.154937744140625, -0.10784912109375, -0.060760498046875, -0.013671875, 0.033416748046875, 0.08050537109375, 0.127593994140625, 0.1746826171875, 0.221771240234375, 0.26885986328125, 0.315948486328125, 0.363037109375, 0.410125732421875, 0.45721435546875, 0.504302978515625, 0.5513916015625, 0.598480224609375, 0.64556884765625, 0.692657470703125, 0.73974609375, 0.786834716796875, 0.83392333984375, 0.881011962890625, 0.9281005859375, 0.975189208984375, 1.02227783203125, 1.069366455078125, 1.116455078125, 1.163543701171875, 1.21063232421875, 1.257720947265625, 1.3048095703125, 1.351898193359375, 1.39898681640625, 1.446075439453125, 1.4931640625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 2.0, 2.0, 8.0, 8.0, 8.0, 9.0, 8.0, 11.0, 12.0, 6.0, 10.0, 12.0, 17.0, 14.0, 24.0, 23.0, 30.0, 30.0, 37.0, 27.0, 34.0, 37.0, 45.0, 36.0, 37.0, 1071.0, 38.0, 34.0, 40.0, 37.0, 34.0, 23.0, 34.0, 33.0, 23.0, 17.0, 28.0, 20.0, 13.0, 9.0, 14.0, 18.0, 9.0, 7.0, 9.0, 12.0, 8.0, 4.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.03125, -2.926177978515625, -2.82110595703125, -2.716033935546875, -2.6109619140625, -2.505889892578125, -2.40081787109375, -2.295745849609375, -2.190673828125, -2.085601806640625, -1.98052978515625, -1.875457763671875, -1.7703857421875, -1.665313720703125, -1.56024169921875, -1.455169677734375, -1.35009765625, -1.245025634765625, -1.13995361328125, -1.034881591796875, -0.9298095703125, -0.824737548828125, -0.71966552734375, -0.614593505859375, -0.509521484375, -0.404449462890625, -0.29937744140625, -0.194305419921875, -0.0892333984375, 0.015838623046875, 0.12091064453125, 0.225982666015625, 0.3310546875, 0.436126708984375, 0.54119873046875, 0.646270751953125, 0.7513427734375, 0.856414794921875, 0.96148681640625, 1.066558837890625, 1.171630859375, 1.276702880859375, 1.38177490234375, 1.486846923828125, 1.5919189453125, 1.696990966796875, 1.80206298828125, 1.907135009765625, 2.01220703125, 2.117279052734375, 2.22235107421875, 2.327423095703125, 2.4324951171875, 2.537567138671875, 2.64263916015625, 2.747711181640625, 2.852783203125, 2.957855224609375, 3.06292724609375, 3.167999267578125, 3.2730712890625, 3.378143310546875, 3.48321533203125, 3.588287353515625, 3.693359375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 9.0, 13.0, 13.0, 9.0, 20.0, 32.0, 40.0, 79.0, 149.0, 277.0, 534.0, 900.0, 1604.0, 2659.0, 4665.0, 8404.0, 15360.0, 27520.0, 54574.0, 118461.0, 1430270.0, 247419.0, 89944.0, 42973.0, 22708.0, 12502.0, 6821.0, 3896.0, 2268.0, 1306.0, 761.0, 386.0, 224.0, 119.0, 60.0, 34.0, 24.0, 10.0, 14.0, 12.0, 10.0, 6.0, 13.0, 6.0, 7.0, 4.0, 2.0, 3.0, 1.0, 3.0], "bins": [-1.763671875, -1.713043212890625, -1.66241455078125, -1.611785888671875, -1.5611572265625, -1.510528564453125, -1.45989990234375, -1.409271240234375, -1.358642578125, -1.308013916015625, -1.25738525390625, -1.206756591796875, -1.1561279296875, -1.105499267578125, -1.05487060546875, -1.004241943359375, -0.95361328125, -0.902984619140625, -0.85235595703125, -0.801727294921875, -0.7510986328125, -0.700469970703125, -0.64984130859375, -0.599212646484375, -0.548583984375, -0.497955322265625, -0.44732666015625, -0.396697998046875, -0.3460693359375, -0.295440673828125, -0.24481201171875, -0.194183349609375, -0.1435546875, -0.092926025390625, -0.04229736328125, 0.008331298828125, 0.0589599609375, 0.109588623046875, 0.16021728515625, 0.210845947265625, 0.261474609375, 0.312103271484375, 0.36273193359375, 0.413360595703125, 0.4639892578125, 0.514617919921875, 0.56524658203125, 0.615875244140625, 0.66650390625, 0.717132568359375, 0.76776123046875, 0.818389892578125, 0.8690185546875, 0.919647216796875, 0.97027587890625, 1.020904541015625, 1.071533203125, 1.122161865234375, 1.17279052734375, 1.223419189453125, 1.2740478515625, 1.324676513671875, 1.37530517578125, 1.425933837890625, 1.4765625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 8.0, 9.0, 8.0, 11.0, 4.0, 10.0, 23.0, 24.0, 26.0, 29.0, 41.0, 39.0, 65.0, 66.0, 60.0, 68.0, 74.0, 58.0, 57.0, 51.0, 39.0, 48.0, 23.0, 22.0, 23.0, 18.0, 17.0, 10.0, 11.0, 9.0, 15.0, 5.0, 5.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.0007381439208984375, -0.0007134824991226196, -0.0006888210773468018, -0.0006641596555709839, -0.000639498233795166, -0.0006148368120193481, -0.0005901753902435303, -0.0005655139684677124, -0.0005408525466918945, -0.0005161911249160767, -0.0004915297031402588, -0.0004668682813644409, -0.00044220685958862305, -0.0004175454378128052, -0.0003928840160369873, -0.00036822259426116943, -0.00034356117248535156, -0.0003188997507095337, -0.0002942383289337158, -0.00026957690715789795, -0.0002449154853820801, -0.0002202540636062622, -0.00019559264183044434, -0.00017093122005462646, -0.0001462697982788086, -0.00012160837650299072, -9.694695472717285e-05, -7.228553295135498e-05, -4.762411117553711e-05, -2.2962689399719238e-05, 1.6987323760986328e-06, 2.6360154151916504e-05, 5.1021575927734375e-05, 7.568299770355225e-05, 0.00010034441947937012, 0.000125005841255188, 0.00014966726303100586, 0.00017432868480682373, 0.0001989901065826416, 0.00022365152835845947, 0.00024831295013427734, 0.0002729743719100952, 0.0002976357936859131, 0.00032229721546173096, 0.00034695863723754883, 0.0003716200590133667, 0.00039628148078918457, 0.00042094290256500244, 0.0004456043243408203, 0.0004702657461166382, 0.0004949271678924561, 0.0005195885896682739, 0.0005442500114440918, 0.0005689114332199097, 0.0005935728549957275, 0.0006182342767715454, 0.0006428956985473633, 0.0006675571203231812, 0.000692218542098999, 0.0007168799638748169, 0.0007415413856506348, 0.0007662028074264526, 0.0007908642292022705, 0.0008155256509780884, 0.0008401870727539062]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 4.0, 4.0, 6.0, 4.0, 8.0, 17.0, 7.0, 15.0, 18.0, 10.0, 24.0, 25.0, 53.0, 57.0, 62.0, 120.0, 211.0, 422.0, 1070.0, 61142.0, 980564.0, 3265.0, 663.0, 274.0, 139.0, 79.0, 73.0, 50.0, 37.0, 32.0, 17.0, 15.0, 13.0, 8.0, 7.0, 8.0, 5.0, 8.0, 5.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.0199737548828125, -0.019437551498413086, -0.018901348114013672, -0.018365144729614258, -0.017828941345214844, -0.01729273796081543, -0.016756534576416016, -0.0162203311920166, -0.015684127807617188, -0.015147924423217773, -0.01461172103881836, -0.014075517654418945, -0.013539314270019531, -0.013003110885620117, -0.012466907501220703, -0.011930704116821289, -0.011394500732421875, -0.010858297348022461, -0.010322093963623047, -0.009785890579223633, -0.009249687194824219, -0.008713483810424805, -0.00817728042602539, -0.0076410770416259766, -0.0071048736572265625, -0.0065686702728271484, -0.006032466888427734, -0.00549626350402832, -0.004960060119628906, -0.004423856735229492, -0.003887653350830078, -0.003351449966430664, -0.00281524658203125, -0.002279043197631836, -0.0017428398132324219, -0.0012066364288330078, -0.0006704330444335938, -0.0001342296600341797, 0.0004019737243652344, 0.0009381771087646484, 0.0014743804931640625, 0.0020105838775634766, 0.0025467872619628906, 0.0030829906463623047, 0.0036191940307617188, 0.004155397415161133, 0.004691600799560547, 0.005227804183959961, 0.005764007568359375, 0.006300210952758789, 0.006836414337158203, 0.007372617721557617, 0.007908821105957031, 0.008445024490356445, 0.00898122787475586, 0.009517431259155273, 0.010053634643554688, 0.010589838027954102, 0.011126041412353516, 0.01166224479675293, 0.012198448181152344, 0.012734651565551758, 0.013270854949951172, 0.013807058334350586, 0.01434326171875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 8.0, 98.0, 553.0, 325.0, 32.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008777879411354661, -0.0007881181663833559, -0.0006984483334235847, -0.0006087785586714745, -0.0005191087257117033, -0.00042943895095959306, -0.0003397691762074828, -0.00025009934324771166, -0.00016042956849560142, -7.075977191561833e-05, 1.8910024664364755e-05, 0.00010857981396839023, 0.00019824961782433093, 0.0002879194216802716, 0.00037758919643238187, 0.000467259029392153, 0.0005569288041442633, 0.0006465985788963735, 0.0007362684118561447, 0.0008259381866082549, 0.0009156080195680261, 0.0010052777361124754, 0.0010949475690722466, 0.0011846174020320177, 0.0012742872349917889, 0.00136395706795156, 0.0014536267844960093, 0.0015432966174557805, 0.0016329664504155517, 0.001722636166960001, 0.0018123059999197721, 0.0019019758328795433, 0.0019916456658393145, 0.0020813154987990856, 0.0021709853317588568, 0.002260655164718628, 0.0023503247648477554, 0.0024399945978075266, 0.0025296644307672977, 0.002619334263727069, 0.00270900409668684, 0.002798673929646611, 0.0028883437626063824, 0.00297801336273551, 0.003067683195695281, 0.003157353028655052, 0.0032470228616148233, 0.0033366926945745945, 0.003426362294703722, 0.003516032127663493, 0.0036057019606232643, 0.003695371560752392, 0.003785041393712163, 0.003874711226671934, 0.003964381292462349, 0.0040540508925914764, 0.004143720958381891, 0.004233390558511019, 0.0043230606243014336, 0.004412730224430561, 0.004502400290220976, 0.004592069890350103, 0.004681739956140518, 0.004771409556269646, 0.004861079156398773]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 5.0, 6.0, 6.0, 4.0, 9.0, 10.0, 9.0, 8.0, 7.0, 18.0, 23.0, 23.0, 20.0, 32.0, 30.0, 34.0, 33.0, 44.0, 33.0, 36.0, 47.0, 48.0, 50.0, 45.0, 37.0, 41.0, 41.0, 39.0, 40.0, 31.0, 32.0, 27.0, 24.0, 22.0, 19.0, 15.0, 11.0, 12.0, 7.0, 7.0, 7.0, 4.0, 4.0, 1.0, 1.0, 8.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003656744956970215, -0.00035262107849121094, -0.0003395676612854004, -0.00032651424407958984, -0.0003134608268737793, -0.00030040740966796875, -0.0002873539924621582, -0.00027430057525634766, -0.0002612471580505371, -0.00024819374084472656, -0.00023514032363891602, -0.00022208690643310547, -0.00020903348922729492, -0.00019598007202148438, -0.00018292665481567383, -0.00016987323760986328, -0.00015681982040405273, -0.0001437664031982422, -0.00013071298599243164, -0.0001176595687866211, -0.00010460615158081055, -9.1552734375e-05, -7.849931716918945e-05, -6.54458999633789e-05, -5.239248275756836e-05, -3.933906555175781e-05, -2.6285648345947266e-05, -1.3232231140136719e-05, -1.7881393432617188e-07, 1.2874603271484375e-05, 2.5928020477294922e-05, 3.898143768310547e-05, 5.2034854888916016e-05, 6.508827209472656e-05, 7.814168930053711e-05, 9.119510650634766e-05, 0.0001042485237121582, 0.00011730194091796875, 0.0001303553581237793, 0.00014340877532958984, 0.0001564621925354004, 0.00016951560974121094, 0.00018256902694702148, 0.00019562244415283203, 0.00020867586135864258, 0.00022172927856445312, 0.00023478269577026367, 0.0002478361129760742, 0.00026088953018188477, 0.0002739429473876953, 0.00028699636459350586, 0.0003000497817993164, 0.00031310319900512695, 0.0003261566162109375, 0.00033921003341674805, 0.0003522634506225586, 0.00036531686782836914, 0.0003783702850341797, 0.00039142370223999023, 0.0004044771194458008, 0.00041753053665161133, 0.0004305839538574219, 0.0004436373710632324, 0.00045669078826904297, 0.0004697442054748535]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 0.0, 6.0, 8.0, 10.0, 9.0, 13.0, 15.0, 25.0, 26.0, 31.0, 30.0, 39.0, 33.0, 41.0, 37.0, 48.0, 61.0, 57.0, 54.0, 42.0, 45.0, 36.0, 47.0, 50.0, 32.0, 34.0, 27.0, 26.0, 16.0, 28.0, 24.0, 22.0, 9.0, 10.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.19140625, -6.96893310546875, -6.7464599609375, -6.52398681640625, -6.301513671875, -6.07904052734375, -5.8565673828125, -5.63409423828125, -5.41162109375, -5.18914794921875, -4.9666748046875, -4.74420166015625, -4.521728515625, -4.29925537109375, -4.0767822265625, -3.85430908203125, -3.6318359375, -3.40936279296875, -3.1868896484375, -2.96441650390625, -2.741943359375, -2.51947021484375, -2.2969970703125, -2.07452392578125, -1.85205078125, -1.62957763671875, -1.4071044921875, -1.18463134765625, -0.962158203125, -0.73968505859375, -0.5172119140625, -0.29473876953125, -0.072265625, 0.15020751953125, 0.3726806640625, 0.59515380859375, 0.817626953125, 1.04010009765625, 1.2625732421875, 1.48504638671875, 1.70751953125, 1.92999267578125, 2.1524658203125, 2.37493896484375, 2.597412109375, 2.81988525390625, 3.0423583984375, 3.26483154296875, 3.4873046875, 3.70977783203125, 3.9322509765625, 4.15472412109375, 4.377197265625, 4.59967041015625, 4.8221435546875, 5.04461669921875, 5.26708984375, 5.48956298828125, 5.7120361328125, 5.93450927734375, 6.156982421875, 6.37945556640625, 6.6019287109375, 6.82440185546875, 7.046875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 9.0, 11.0, 7.0, 19.0, 34.0, 45.0, 65.0, 107.0, 177.0, 264.0, 408.0, 678.0, 1322.0, 3092.0, 9837.0, 48524.0, 316415.0, 557691.0, 85954.0, 15737.0, 4231.0, 1738.0, 859.0, 485.0, 279.0, 201.0, 125.0, 78.0, 59.0, 40.0, 20.0, 25.0, 7.0, 5.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.703125, -8.4324951171875, -8.161865234375, -7.8912353515625, -7.62060546875, -7.3499755859375, -7.079345703125, -6.8087158203125, -6.5380859375, -6.2674560546875, -5.996826171875, -5.7261962890625, -5.45556640625, -5.1849365234375, -4.914306640625, -4.6436767578125, -4.373046875, -4.1024169921875, -3.831787109375, -3.5611572265625, -3.29052734375, -3.0198974609375, -2.749267578125, -2.4786376953125, -2.2080078125, -1.9373779296875, -1.666748046875, -1.3961181640625, -1.12548828125, -0.8548583984375, -0.584228515625, -0.3135986328125, -0.04296875, 0.2276611328125, 0.498291015625, 0.7689208984375, 1.03955078125, 1.3101806640625, 1.580810546875, 1.8514404296875, 2.1220703125, 2.3927001953125, 2.663330078125, 2.9339599609375, 3.20458984375, 3.4752197265625, 3.745849609375, 4.0164794921875, 4.287109375, 4.5577392578125, 4.828369140625, 5.0989990234375, 5.36962890625, 5.6402587890625, 5.910888671875, 6.1815185546875, 6.4521484375, 6.7227783203125, 6.993408203125, 7.2640380859375, 7.53466796875, 7.8052978515625, 8.075927734375, 8.3465576171875, 8.6171875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 4.0, 13.0, 2.0, 5.0, 9.0, 18.0, 14.0, 24.0, 17.0, 21.0, 35.0, 37.0, 47.0, 49.0, 53.0, 50.0, 66.0, 115.0, 1490.0, 417.0, 112.0, 71.0, 51.0, 44.0, 33.0, 48.0, 29.0, 27.0, 27.0, 12.0, 23.0, 20.0, 10.0, 14.0, 8.0, 6.0, 7.0, 4.0, 9.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.5, -18.848876953125, -18.19775390625, -17.546630859375, -16.8955078125, -16.244384765625, -15.59326171875, -14.942138671875, -14.291015625, -13.639892578125, -12.98876953125, -12.337646484375, -11.6865234375, -11.035400390625, -10.38427734375, -9.733154296875, -9.08203125, -8.430908203125, -7.77978515625, -7.128662109375, -6.4775390625, -5.826416015625, -5.17529296875, -4.524169921875, -3.873046875, -3.221923828125, -2.57080078125, -1.919677734375, -1.2685546875, -0.617431640625, 0.03369140625, 0.684814453125, 1.3359375, 1.987060546875, 2.63818359375, 3.289306640625, 3.9404296875, 4.591552734375, 5.24267578125, 5.893798828125, 6.544921875, 7.196044921875, 7.84716796875, 8.498291015625, 9.1494140625, 9.800537109375, 10.45166015625, 11.102783203125, 11.75390625, 12.405029296875, 13.05615234375, 13.707275390625, 14.3583984375, 15.009521484375, 15.66064453125, 16.311767578125, 16.962890625, 17.614013671875, 18.26513671875, 18.916259765625, 19.5673828125, 20.218505859375, 20.86962890625, 21.520751953125, 22.171875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 5.0, 11.0, 9.0, 11.0, 13.0, 27.0, 23.0, 39.0, 51.0, 71.0, 75.0, 117.0, 166.0, 229.0, 388.0, 915.0, 7227.0, 3084851.0, 48544.0, 1449.0, 501.0, 296.0, 159.0, 133.0, 101.0, 69.0, 50.0, 47.0, 37.0, 20.0, 21.0, 4.0, 13.0, 8.0, 7.0, 3.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.15625, -53.46826171875, -51.7802734375, -50.09228515625, -48.404296875, -46.71630859375, -45.0283203125, -43.34033203125, -41.65234375, -39.96435546875, -38.2763671875, -36.58837890625, -34.900390625, -33.21240234375, -31.5244140625, -29.83642578125, -28.1484375, -26.46044921875, -24.7724609375, -23.08447265625, -21.396484375, -19.70849609375, -18.0205078125, -16.33251953125, -14.64453125, -12.95654296875, -11.2685546875, -9.58056640625, -7.892578125, -6.20458984375, -4.5166015625, -2.82861328125, -1.140625, 0.54736328125, 2.2353515625, 3.92333984375, 5.611328125, 7.29931640625, 8.9873046875, 10.67529296875, 12.36328125, 14.05126953125, 15.7392578125, 17.42724609375, 19.115234375, 20.80322265625, 22.4912109375, 24.17919921875, 25.8671875, 27.55517578125, 29.2431640625, 30.93115234375, 32.619140625, 34.30712890625, 35.9951171875, 37.68310546875, 39.37109375, 41.05908203125, 42.7470703125, 44.43505859375, 46.123046875, 47.81103515625, 49.4990234375, 51.18701171875, 52.875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 8.0, 19.0, 52.0, 104.0, 168.0, 208.0, 169.0, 145.0, 72.0, 33.0, 11.0, 6.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.83000946044922, -37.64575958251953, -36.461509704589844, -35.277259826660156, -34.09300994873047, -32.90876007080078, -31.724510192871094, -30.540260314941406, -29.35601043701172, -28.17176055908203, -26.987510681152344, -25.803260803222656, -24.61901092529297, -23.43476104736328, -22.250511169433594, -21.066261291503906, -19.88201141357422, -18.69776153564453, -17.513511657714844, -16.329261779785156, -15.145011901855469, -13.960762023925781, -12.776512145996094, -11.592262268066406, -10.408012390136719, -9.223762512207031, -8.039512634277344, -6.855262756347656, -5.671012878417969, -4.486763000488281, -3.3025131225585938, -2.1182632446289062, -0.9340095520019531, 0.2502403259277344, 1.4344902038574219, 2.6187400817871094, 3.802989959716797, 4.987239837646484, 6.171489715576172, 7.355739593505859, 8.539989471435547, 9.724239349365234, 10.908489227294922, 12.09273910522461, 13.276988983154297, 14.461238861083984, 15.645488739013672, 16.82973861694336, 18.013988494873047, 19.198238372802734, 20.382488250732422, 21.56673812866211, 22.750988006591797, 23.935237884521484, 25.119487762451172, 26.30373764038086, 27.487987518310547, 28.672237396240234, 29.856487274169922, 31.04073715209961, 32.2249870300293, 33.409236907958984, 34.59348678588867, 35.77773666381836, 36.96198654174805]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 2.0, 2.0, 12.0, 14.0, 17.0, 24.0, 24.0, 18.0, 30.0, 30.0, 35.0, 33.0, 41.0, 27.0, 35.0, 42.0, 43.0, 57.0, 42.0, 42.0, 47.0, 47.0, 40.0, 39.0, 33.0, 37.0, 35.0, 28.0, 20.0, 12.0, 13.0, 16.0, 7.0, 17.0, 9.0, 6.0, 4.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.27732849121094, -60.255306243896484, -58.2332878112793, -56.211265563964844, -54.18924331665039, -52.16722106933594, -50.14520263671875, -48.1231803894043, -46.101158142089844, -44.07913589477539, -42.0571174621582, -40.03509521484375, -38.0130729675293, -35.991050720214844, -33.969032287597656, -31.947010040283203, -29.924991607666016, -27.902971267700195, -25.880949020385742, -23.858928680419922, -21.83690643310547, -19.81488609313965, -17.792865753173828, -15.770844459533691, -13.748823165893555, -11.726801872253418, -9.704780578613281, -7.682760238647461, -5.660738945007324, -3.6387176513671875, -1.6166973114013672, 0.40532398223876953, 2.4273452758789062, 4.449366569519043, 6.4713873863220215, 8.493408203125, 10.515429496765137, 12.537450790405273, 14.559471130371094, 16.581493377685547, 18.603513717651367, 20.625534057617188, 22.64755630493164, 24.66957664489746, 26.69159698486328, 28.713619232177734, 30.735639572143555, 32.757659912109375, 34.77968215942383, 36.80170440673828, 38.82372283935547, 40.84574508666992, 42.867767333984375, 44.88978576660156, 46.911808013916016, 48.93383026123047, 50.955848693847656, 52.97787094116211, 54.9998893737793, 57.02191162109375, 59.0439338684082, 61.065956115722656, 63.087974548339844, 65.10999298095703, 67.13201904296875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 6.0, 11.0, 6.0, 5.0, 8.0, 16.0, 28.0, 17.0, 23.0, 27.0, 34.0, 48.0, 42.0, 48.0, 36.0, 40.0, 51.0, 64.0, 47.0, 47.0, 36.0, 53.0, 46.0, 34.0, 29.0, 30.0, 24.0, 32.0, 21.0, 21.0, 26.0, 17.0, 10.0, 9.0, 4.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.53515625, -7.2987060546875, -7.062255859375, -6.8258056640625, -6.58935546875, -6.3529052734375, -6.116455078125, -5.8800048828125, -5.6435546875, -5.4071044921875, -5.170654296875, -4.9342041015625, -4.69775390625, -4.4613037109375, -4.224853515625, -3.9884033203125, -3.751953125, -3.5155029296875, -3.279052734375, -3.0426025390625, -2.80615234375, -2.5697021484375, -2.333251953125, -2.0968017578125, -1.8603515625, -1.6239013671875, -1.387451171875, -1.1510009765625, -0.91455078125, -0.6781005859375, -0.441650390625, -0.2052001953125, 0.03125, 0.2677001953125, 0.504150390625, 0.7406005859375, 0.97705078125, 1.2135009765625, 1.449951171875, 1.6864013671875, 1.9228515625, 2.1593017578125, 2.395751953125, 2.6322021484375, 2.86865234375, 3.1051025390625, 3.341552734375, 3.5780029296875, 3.814453125, 4.0509033203125, 4.287353515625, 4.5238037109375, 4.76025390625, 4.9967041015625, 5.233154296875, 5.4696044921875, 5.7060546875, 5.9425048828125, 6.178955078125, 6.4154052734375, 6.65185546875, 6.8883056640625, 7.124755859375, 7.3612060546875, 7.59765625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 10.0, 8.0, 9.0, 9.0, 16.0, 12.0, 29.0, 24.0, 25.0, 35.0, 32.0, 40.0, 66.0, 128.0, 377.0, 1740.0, 37688.0, 2991276.0, 1150348.0, 10756.0, 1024.0, 241.0, 85.0, 46.0, 41.0, 29.0, 24.0, 31.0, 16.0, 34.0, 25.0, 18.0, 10.0, 13.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.234375, -23.36376953125, -22.4931640625, -21.62255859375, -20.751953125, -19.88134765625, -19.0107421875, -18.14013671875, -17.26953125, -16.39892578125, -15.5283203125, -14.65771484375, -13.787109375, -12.91650390625, -12.0458984375, -11.17529296875, -10.3046875, -9.43408203125, -8.5634765625, -7.69287109375, -6.822265625, -5.95166015625, -5.0810546875, -4.21044921875, -3.33984375, -2.46923828125, -1.5986328125, -0.72802734375, 0.142578125, 1.01318359375, 1.8837890625, 2.75439453125, 3.625, 4.49560546875, 5.3662109375, 6.23681640625, 7.107421875, 7.97802734375, 8.8486328125, 9.71923828125, 10.58984375, 11.46044921875, 12.3310546875, 13.20166015625, 14.072265625, 14.94287109375, 15.8134765625, 16.68408203125, 17.5546875, 18.42529296875, 19.2958984375, 20.16650390625, 21.037109375, 21.90771484375, 22.7783203125, 23.64892578125, 24.51953125, 25.39013671875, 26.2607421875, 27.13134765625, 28.001953125, 28.87255859375, 29.7431640625, 30.61376953125, 31.484375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 10.0, 9.0, 13.0, 14.0, 26.0, 28.0, 37.0, 53.0, 79.0, 112.0, 183.0, 249.0, 352.0, 447.0, 525.0, 493.0, 411.0, 303.0, 225.0, 149.0, 98.0, 85.0, 55.0, 36.0, 23.0, 17.0, 11.0, 15.0, 5.0, 11.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.59375, -16.1317138671875, -15.669677734375, -15.2076416015625, -14.74560546875, -14.2835693359375, -13.821533203125, -13.3594970703125, -12.8974609375, -12.4354248046875, -11.973388671875, -11.5113525390625, -11.04931640625, -10.5872802734375, -10.125244140625, -9.6632080078125, -9.201171875, -8.7391357421875, -8.277099609375, -7.8150634765625, -7.35302734375, -6.8909912109375, -6.428955078125, -5.9669189453125, -5.5048828125, -5.0428466796875, -4.580810546875, -4.1187744140625, -3.65673828125, -3.1947021484375, -2.732666015625, -2.2706298828125, -1.80859375, -1.3465576171875, -0.884521484375, -0.4224853515625, 0.03955078125, 0.5015869140625, 0.963623046875, 1.4256591796875, 1.8876953125, 2.3497314453125, 2.811767578125, 3.2738037109375, 3.73583984375, 4.1978759765625, 4.659912109375, 5.1219482421875, 5.583984375, 6.0460205078125, 6.508056640625, 6.9700927734375, 7.43212890625, 7.8941650390625, 8.356201171875, 8.8182373046875, 9.2802734375, 9.7423095703125, 10.204345703125, 10.6663818359375, 11.12841796875, 11.5904541015625, 12.052490234375, 12.5145263671875, 12.9765625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 10.0, 8.0, 6.0, 8.0, 14.0, 19.0, 16.0, 32.0, 46.0, 47.0, 58.0, 79.0, 90.0, 115.0, 149.0, 221.0, 360.0, 550.0, 1943.0, 143641.0, 4017017.0, 26840.0, 1236.0, 524.0, 300.0, 238.0, 161.0, 140.0, 100.0, 76.0, 60.0, 44.0, 36.0, 32.0, 21.0, 19.0, 16.0, 7.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.46875, -45.794921875, -44.12109375, -42.447265625, -40.7734375, -39.099609375, -37.42578125, -35.751953125, -34.078125, -32.404296875, -30.73046875, -29.056640625, -27.3828125, -25.708984375, -24.03515625, -22.361328125, -20.6875, -19.013671875, -17.33984375, -15.666015625, -13.9921875, -12.318359375, -10.64453125, -8.970703125, -7.296875, -5.623046875, -3.94921875, -2.275390625, -0.6015625, 1.072265625, 2.74609375, 4.419921875, 6.09375, 7.767578125, 9.44140625, 11.115234375, 12.7890625, 14.462890625, 16.13671875, 17.810546875, 19.484375, 21.158203125, 22.83203125, 24.505859375, 26.1796875, 27.853515625, 29.52734375, 31.201171875, 32.875, 34.548828125, 36.22265625, 37.896484375, 39.5703125, 41.244140625, 42.91796875, 44.591796875, 46.265625, 47.939453125, 49.61328125, 51.287109375, 52.9609375, 54.634765625, 56.30859375, 57.982421875, 59.65625]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 7.0, 166.0, 555.0, 273.0, 16.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.591453552246094, -31.095874786376953, -22.600296020507812, -14.104717254638672, -5.609138488769531, 2.8864402770996094, 11.38201904296875, 19.87759780883789, 28.37317657470703, 36.86875534057617, 45.36433410644531, 53.85991287231445, 62.355491638183594, 70.85107421875, 79.34664916992188, 87.84222412109375, 96.33780670166016, 104.83338928222656, 113.32896423339844, 121.82453918457031, 130.32012939453125, 138.81570434570312, 147.311279296875, 155.80685424804688, 164.30242919921875, 172.79800415039062, 181.2935791015625, 189.78916931152344, 198.2847442626953, 206.7803192138672, 215.27590942382812, 223.771484375, 232.26705932617188, 240.76263427734375, 249.25820922851562, 257.7537841796875, 266.2493896484375, 274.7449645996094, 283.24053955078125, 291.7361145019531, 300.231689453125, 308.7272644042969, 317.22283935546875, 325.7184143066406, 334.2139892578125, 342.7095947265625, 351.2051696777344, 359.70074462890625, 368.1963195800781, 376.69189453125, 385.1874694824219, 393.68304443359375, 402.17864990234375, 410.6742248535156, 419.1697998046875, 427.6653747558594, 436.16094970703125, 444.6565246582031, 453.152099609375, 461.6476745605469, 470.14324951171875, 478.63885498046875, 487.1344299316406, 495.6300048828125, 504.1255798339844]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 3.0, 3.0, 0.0, 3.0, 4.0, 7.0, 4.0, 5.0, 10.0, 10.0, 12.0, 12.0, 13.0, 15.0, 19.0, 23.0, 19.0, 23.0, 17.0, 24.0, 28.0, 28.0, 39.0, 33.0, 33.0, 42.0, 42.0, 32.0, 26.0, 42.0, 43.0, 33.0, 30.0, 33.0, 42.0, 32.0, 30.0, 29.0, 26.0, 22.0, 17.0, 19.0, 17.0, 12.0, 13.0, 9.0, 7.0, 9.0, 2.0, 6.0, 8.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-34.30706787109375, -33.127113342285156, -31.94715690612793, -30.767202377319336, -29.58724594116211, -28.407291412353516, -27.227336883544922, -26.047382354736328, -24.8674259185791, -23.687471389770508, -22.50751495361328, -21.327560424804688, -20.147605895996094, -18.967649459838867, -17.787694931030273, -16.607738494873047, -15.427783966064453, -14.247828483581543, -13.067873001098633, -11.887918472290039, -10.707962989807129, -9.528007507324219, -8.348052978515625, -7.168097496032715, -5.988142013549805, -4.8081865310668945, -3.6282315254211426, -2.4482762813568115, -1.2683210372924805, -0.08836555480957031, 1.0915894508361816, 2.2715444564819336, 3.4514999389648438, 4.631455421447754, 5.811410427093506, 6.991365432739258, 8.171320915222168, 9.351276397705078, 10.531230926513672, 11.711186408996582, 12.891141891479492, 14.071097373962402, 15.251052856445312, 16.431007385253906, 17.6109619140625, 18.790918350219727, 19.97087287902832, 21.150829315185547, 22.33078384399414, 23.510738372802734, 24.69069480895996, 25.870649337768555, 27.05060577392578, 28.230560302734375, 29.41051483154297, 30.590469360351562, 31.77042579650879, 32.950382232666016, 34.13033676147461, 35.3102912902832, 36.4902458190918, 37.670204162597656, 38.85015869140625, 40.030113220214844, 41.21006774902344]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 7.0, 3.0, 9.0, 7.0, 22.0, 15.0, 17.0, 25.0, 38.0, 35.0, 31.0, 49.0, 58.0, 48.0, 56.0, 56.0, 47.0, 45.0, 48.0, 63.0, 53.0, 48.0, 36.0, 35.0, 31.0, 26.0, 33.0, 17.0, 17.0, 9.0, 9.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.578125, -10.31695556640625, -10.0557861328125, -9.79461669921875, -9.533447265625, -9.27227783203125, -9.0111083984375, -8.74993896484375, -8.48876953125, -8.22760009765625, -7.9664306640625, -7.70526123046875, -7.444091796875, -7.18292236328125, -6.9217529296875, -6.66058349609375, -6.3994140625, -6.13824462890625, -5.8770751953125, -5.61590576171875, -5.354736328125, -5.09356689453125, -4.8323974609375, -4.57122802734375, -4.31005859375, -4.04888916015625, -3.7877197265625, -3.52655029296875, -3.265380859375, -3.00421142578125, -2.7430419921875, -2.48187255859375, -2.220703125, -1.95953369140625, -1.6983642578125, -1.43719482421875, -1.176025390625, -0.91485595703125, -0.6536865234375, -0.39251708984375, -0.13134765625, 0.12982177734375, 0.3909912109375, 0.65216064453125, 0.913330078125, 1.17449951171875, 1.4356689453125, 1.69683837890625, 1.9580078125, 2.21917724609375, 2.4803466796875, 2.74151611328125, 3.002685546875, 3.26385498046875, 3.5250244140625, 3.78619384765625, 4.04736328125, 4.30853271484375, 4.5697021484375, 4.83087158203125, 5.092041015625, 5.35321044921875, 5.6143798828125, 5.87554931640625, 6.13671875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 1.0, 5.0, 10.0, 6.0, 11.0, 19.0, 21.0, 28.0, 49.0, 87.0, 154.0, 265.0, 460.0, 824.0, 1626.0, 3046.0, 6209.0, 12985.0, 27821.0, 62169.0, 161522.0, 460775.0, 183625.0, 68284.0, 30493.0, 14067.0, 6861.0, 3414.0, 1684.0, 889.0, 480.0, 238.0, 170.0, 89.0, 61.0, 41.0, 20.0, 16.0, 10.0, 8.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.083984375, -2.0179443359375, -1.951904296875, -1.8858642578125, -1.81982421875, -1.7537841796875, -1.687744140625, -1.6217041015625, -1.5556640625, -1.4896240234375, -1.423583984375, -1.3575439453125, -1.29150390625, -1.2254638671875, -1.159423828125, -1.0933837890625, -1.02734375, -0.9613037109375, -0.895263671875, -0.8292236328125, -0.76318359375, -0.6971435546875, -0.631103515625, -0.5650634765625, -0.4990234375, -0.4329833984375, -0.366943359375, -0.3009033203125, -0.23486328125, -0.1688232421875, -0.102783203125, -0.0367431640625, 0.029296875, 0.0953369140625, 0.161376953125, 0.2274169921875, 0.29345703125, 0.3594970703125, 0.425537109375, 0.4915771484375, 0.5576171875, 0.6236572265625, 0.689697265625, 0.7557373046875, 0.82177734375, 0.8878173828125, 0.953857421875, 1.0198974609375, 1.0859375, 1.1519775390625, 1.218017578125, 1.2840576171875, 1.35009765625, 1.4161376953125, 1.482177734375, 1.5482177734375, 1.6142578125, 1.6802978515625, 1.746337890625, 1.8123779296875, 1.87841796875, 1.9444580078125, 2.010498046875, 2.0765380859375, 2.142578125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 8.0, 5.0, 6.0, 11.0, 12.0, 16.0, 18.0, 16.0, 20.0, 26.0, 30.0, 35.0, 26.0, 39.0, 32.0, 41.0, 33.0, 47.0, 46.0, 38.0, 1067.0, 49.0, 34.0, 47.0, 38.0, 35.0, 36.0, 25.0, 16.0, 27.0, 17.0, 23.0, 22.0, 13.0, 22.0, 8.0, 3.0, 12.0, 9.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-4.8203125, -4.690185546875, -4.56005859375, -4.429931640625, -4.2998046875, -4.169677734375, -4.03955078125, -3.909423828125, -3.779296875, -3.649169921875, -3.51904296875, -3.388916015625, -3.2587890625, -3.128662109375, -2.99853515625, -2.868408203125, -2.73828125, -2.608154296875, -2.47802734375, -2.347900390625, -2.2177734375, -2.087646484375, -1.95751953125, -1.827392578125, -1.697265625, -1.567138671875, -1.43701171875, -1.306884765625, -1.1767578125, -1.046630859375, -0.91650390625, -0.786376953125, -0.65625, -0.526123046875, -0.39599609375, -0.265869140625, -0.1357421875, -0.005615234375, 0.12451171875, 0.254638671875, 0.384765625, 0.514892578125, 0.64501953125, 0.775146484375, 0.9052734375, 1.035400390625, 1.16552734375, 1.295654296875, 1.42578125, 1.555908203125, 1.68603515625, 1.816162109375, 1.9462890625, 2.076416015625, 2.20654296875, 2.336669921875, 2.466796875, 2.596923828125, 2.72705078125, 2.857177734375, 2.9873046875, 3.117431640625, 3.24755859375, 3.377685546875, 3.5078125]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 6.0, 0.0, 4.0, 4.0, 9.0, 12.0, 13.0, 17.0, 27.0, 47.0, 58.0, 116.0, 209.0, 395.0, 726.0, 1385.0, 2670.0, 5138.0, 10467.0, 20771.0, 42941.0, 95093.0, 304235.0, 1415417.0, 105405.0, 46664.0, 22459.0, 11191.0, 5686.0, 2791.0, 1478.0, 771.0, 411.0, 206.0, 120.0, 71.0, 30.0, 30.0, 13.0, 18.0, 5.0, 10.0, 8.0, 5.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.732421875, -1.66839599609375, -1.6043701171875, -1.54034423828125, -1.476318359375, -1.41229248046875, -1.3482666015625, -1.28424072265625, -1.22021484375, -1.15618896484375, -1.0921630859375, -1.02813720703125, -0.964111328125, -0.90008544921875, -0.8360595703125, -0.77203369140625, -0.7080078125, -0.64398193359375, -0.5799560546875, -0.51593017578125, -0.451904296875, -0.38787841796875, -0.3238525390625, -0.25982666015625, -0.19580078125, -0.13177490234375, -0.0677490234375, -0.00372314453125, 0.060302734375, 0.12432861328125, 0.1883544921875, 0.25238037109375, 0.31640625, 0.38043212890625, 0.4444580078125, 0.50848388671875, 0.572509765625, 0.63653564453125, 0.7005615234375, 0.76458740234375, 0.82861328125, 0.89263916015625, 0.9566650390625, 1.02069091796875, 1.084716796875, 1.14874267578125, 1.2127685546875, 1.27679443359375, 1.3408203125, 1.40484619140625, 1.4688720703125, 1.53289794921875, 1.596923828125, 1.66094970703125, 1.7249755859375, 1.78900146484375, 1.85302734375, 1.91705322265625, 1.9810791015625, 2.04510498046875, 2.109130859375, 2.17315673828125, 2.2371826171875, 2.30120849609375, 2.365234375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 7.0, 5.0, 5.0, 7.0, 5.0, 10.0, 9.0, 14.0, 17.0, 28.0, 34.0, 39.0, 31.0, 58.0, 62.0, 79.0, 67.0, 81.0, 63.0, 72.0, 60.0, 51.0, 36.0, 29.0, 21.0, 23.0, 22.0, 9.0, 10.0, 7.0, 8.0, 6.0, 5.0, 6.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008630752563476562, -0.0008376613259315491, -0.0008122473955154419, -0.0007868334650993347, -0.0007614195346832275, -0.0007360056042671204, -0.0007105916738510132, -0.000685177743434906, -0.0006597638130187988, -0.0006343498826026917, -0.0006089359521865845, -0.0005835220217704773, -0.0005581080913543701, -0.0005326941609382629, -0.0005072802305221558, -0.0004818663001060486, -0.0004564523696899414, -0.00043103843927383423, -0.00040562450885772705, -0.0003802105784416199, -0.0003547966480255127, -0.0003293827176094055, -0.00030396878719329834, -0.00027855485677719116, -0.000253140926361084, -0.0002277269959449768, -0.00020231306552886963, -0.00017689913511276245, -0.00015148520469665527, -0.0001260712742805481, -0.00010065734386444092, -7.524341344833374e-05, -4.982948303222656e-05, -2.4415552616119385e-05, 9.98377799987793e-07, 2.641230821609497e-05, 5.182623863220215e-05, 7.724016904830933e-05, 0.0001026540994644165, 0.00012806802988052368, 0.00015348196029663086, 0.00017889589071273804, 0.00020430982112884521, 0.0002297237515449524, 0.00025513768196105957, 0.00028055161237716675, 0.0003059655427932739, 0.0003313794732093811, 0.0003567934036254883, 0.00038220733404159546, 0.00040762126445770264, 0.0004330351948738098, 0.000458449125289917, 0.00048386305570602417, 0.0005092769861221313, 0.0005346909165382385, 0.0005601048469543457, 0.0005855187773704529, 0.0006109327077865601, 0.0006363466382026672, 0.0006617605686187744, 0.0006871744990348816, 0.0007125884294509888, 0.000738002359867096, 0.0007634162902832031]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 12.0, 6.0, 6.0, 13.0, 18.0, 22.0, 35.0, 36.0, 44.0, 69.0, 101.0, 151.0, 310.0, 783.0, 29504.0, 1012354.0, 3894.0, 521.0, 212.0, 116.0, 85.0, 57.0, 40.0, 29.0, 29.0, 21.0, 13.0, 5.0, 12.0, 8.0, 11.0, 5.0, 5.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0170135498046875, -0.016452550888061523, -0.015891551971435547, -0.01533055305480957, -0.014769554138183594, -0.014208555221557617, -0.01364755630493164, -0.013086557388305664, -0.012525558471679688, -0.011964559555053711, -0.011403560638427734, -0.010842561721801758, -0.010281562805175781, -0.009720563888549805, -0.009159564971923828, -0.008598566055297852, -0.008037567138671875, -0.0074765682220458984, -0.006915569305419922, -0.006354570388793945, -0.005793571472167969, -0.005232572555541992, -0.004671573638916016, -0.004110574722290039, -0.0035495758056640625, -0.002988576889038086, -0.0024275779724121094, -0.0018665790557861328, -0.0013055801391601562, -0.0007445812225341797, -0.00018358230590820312, 0.00037741661071777344, 0.00093841552734375, 0.0014994144439697266, 0.002060413360595703, 0.0026214122772216797, 0.0031824111938476562, 0.003743410110473633, 0.004304409027099609, 0.004865407943725586, 0.0054264068603515625, 0.005987405776977539, 0.006548404693603516, 0.007109403610229492, 0.007670402526855469, 0.008231401443481445, 0.008792400360107422, 0.009353399276733398, 0.009914398193359375, 0.010475397109985352, 0.011036396026611328, 0.011597394943237305, 0.012158393859863281, 0.012719392776489258, 0.013280391693115234, 0.013841390609741211, 0.014402389526367188, 0.014963388442993164, 0.01552438735961914, 0.016085386276245117, 0.016646385192871094, 0.01720738410949707, 0.017768383026123047, 0.018329381942749023, 0.018890380859375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 14.0, 2.0, 17.0, 21.0, 29.0, 39.0, 51.0, 63.0, 80.0, 116.0, 82.0, 87.0, 84.0, 53.0, 82.0, 46.0, 45.0, 28.0, 25.0, 9.0, 14.0, 7.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00024530774680897593, -0.0002335798053536564, -0.0002218518638983369, -0.00021012392244301736, -0.0001983959664357826, -0.0001866680249804631, -0.00017494008352514356, -0.0001632121275179088, -0.0001514841860625893, -0.00013975624460726976, -0.00012802830315195024, -0.0001163003544206731, -0.00010457240568939596, -9.284446423407644e-05, -8.111652277875692e-05, -6.938857404747978e-05, -5.766063986811787e-05, -4.593269477481954e-05, -3.420474968152121e-05, -2.2476808226201683e-05, -1.0748863132903352e-05, 9.790819603949785e-07, 1.2707023415714502e-05, 2.443497214699164e-05, 3.6162913602311164e-05, 4.7890858695609495e-05, 5.9618803788907826e-05, 7.134674524422735e-05, 8.307468669954687e-05, 9.480263543082401e-05, 0.00010653057688614354, 0.00011825852561742067, 0.0001299864670727402, 0.00014171440852805972, 0.00015344234998337924, 0.00016517029143869877, 0.00017689824744593352, 0.00018862618890125304, 0.00020035413035657257, 0.00021208208636380732, 0.00022381002781912684, 0.00023553796927444637, 0.0002472659107297659, 0.0002589938521850854, 0.00027072179364040494, 0.0002824497641995549, 0.000294177676551044, 0.00030590564711019397, 0.00031763355946168303, 0.00032936150091700256, 0.0003410894423723221, 0.0003528173838276416, 0.00036454532528296113, 0.0003762732958421111, 0.0003880012081936002, 0.00039972917875275016, 0.0004114571202080697, 0.0004231850616633892, 0.00043491300311870873, 0.00044664094457402825, 0.0004583688860293478, 0.0004700968274846673, 0.0004818247980438173, 0.0004935527103953063, 0.0005052806809544563]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 8.0, 14.0, 8.0, 13.0, 10.0, 12.0, 15.0, 28.0, 18.0, 23.0, 26.0, 32.0, 34.0, 31.0, 45.0, 42.0, 31.0, 46.0, 40.0, 47.0, 48.0, 33.0, 45.0, 36.0, 39.0, 30.0, 28.0, 38.0, 26.0, 17.0, 24.0, 13.0, 19.0, 25.0, 18.0, 4.0, 5.0, 6.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 1.0], "bins": [-0.00042068958282470703, -0.0004084687680006027, -0.0003962479531764984, -0.0003840271383523941, -0.0003718063235282898, -0.0003595855087041855, -0.0003473646938800812, -0.00033514387905597687, -0.00032292306423187256, -0.00031070224940776825, -0.00029848143458366394, -0.00028626061975955963, -0.0002740398049354553, -0.000261818990111351, -0.0002495981752872467, -0.0002373773604631424, -0.00022515654563903809, -0.00021293573081493378, -0.00020071491599082947, -0.00018849410116672516, -0.00017627328634262085, -0.00016405247151851654, -0.00015183165669441223, -0.00013961084187030792, -0.0001273900270462036, -0.0001151692122220993, -0.000102948397397995, -9.072758257389069e-05, -7.850676774978638e-05, -6.628595292568207e-05, -5.406513810157776e-05, -4.184432327747345e-05, -2.962350845336914e-05, -1.740269362926483e-05, -5.1818788051605225e-06, 7.038936018943787e-06, 1.9259750843048096e-05, 3.1480565667152405e-05, 4.3701380491256714e-05, 5.592219531536102e-05, 6.814301013946533e-05, 8.036382496356964e-05, 9.258463978767395e-05, 0.00010480545461177826, 0.00011702626943588257, 0.00012924708425998688, 0.0001414678990840912, 0.0001536887139081955, 0.0001659095287322998, 0.00017813034355640411, 0.00019035115838050842, 0.00020257197320461273, 0.00021479278802871704, 0.00022701360285282135, 0.00023923441767692566, 0.00025145523250102997, 0.0002636760473251343, 0.0002758968621492386, 0.0002881176769733429, 0.0003003384917974472, 0.0003125593066215515, 0.0003247801214456558, 0.00033700093626976013, 0.00034922175109386444, 0.00036144256591796875]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 7.0, 3.0, 9.0, 7.0, 22.0, 15.0, 17.0, 25.0, 38.0, 35.0, 31.0, 49.0, 58.0, 48.0, 56.0, 56.0, 47.0, 45.0, 48.0, 63.0, 53.0, 48.0, 36.0, 35.0, 31.0, 26.0, 33.0, 17.0, 17.0, 9.0, 9.0, 7.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.578125, -10.31695556640625, -10.0557861328125, -9.79461669921875, -9.533447265625, -9.27227783203125, -9.0111083984375, -8.74993896484375, -8.48876953125, -8.22760009765625, -7.9664306640625, -7.70526123046875, -7.444091796875, -7.18292236328125, -6.9217529296875, -6.66058349609375, -6.3994140625, -6.13824462890625, -5.8770751953125, -5.61590576171875, -5.354736328125, -5.09356689453125, -4.8323974609375, -4.57122802734375, -4.31005859375, -4.04888916015625, -3.7877197265625, -3.52655029296875, -3.265380859375, -3.00421142578125, -2.7430419921875, -2.48187255859375, -2.220703125, -1.95953369140625, -1.6983642578125, -1.43719482421875, -1.176025390625, -0.91485595703125, -0.6536865234375, -0.39251708984375, -0.13134765625, 0.12982177734375, 0.3909912109375, 0.65216064453125, 0.913330078125, 1.17449951171875, 1.4356689453125, 1.69683837890625, 1.9580078125, 2.21917724609375, 2.4803466796875, 2.74151611328125, 3.002685546875, 3.26385498046875, 3.5250244140625, 3.78619384765625, 4.04736328125, 4.30853271484375, 4.5697021484375, 4.83087158203125, 5.092041015625, 5.35321044921875, 5.6143798828125, 5.87554931640625, 6.13671875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 9.0, 15.0, 20.0, 35.0, 64.0, 117.0, 229.0, 398.0, 817.0, 2018.0, 5466.0, 19058.0, 99717.0, 627293.0, 242277.0, 36449.0, 9141.0, 2999.0, 1216.0, 555.0, 308.0, 144.0, 92.0, 44.0, 23.0, 16.0, 15.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-10.875, -10.60791015625, -10.3408203125, -10.07373046875, -9.806640625, -9.53955078125, -9.2724609375, -9.00537109375, -8.73828125, -8.47119140625, -8.2041015625, -7.93701171875, -7.669921875, -7.40283203125, -7.1357421875, -6.86865234375, -6.6015625, -6.33447265625, -6.0673828125, -5.80029296875, -5.533203125, -5.26611328125, -4.9990234375, -4.73193359375, -4.46484375, -4.19775390625, -3.9306640625, -3.66357421875, -3.396484375, -3.12939453125, -2.8623046875, -2.59521484375, -2.328125, -2.06103515625, -1.7939453125, -1.52685546875, -1.259765625, -0.99267578125, -0.7255859375, -0.45849609375, -0.19140625, 0.07568359375, 0.3427734375, 0.60986328125, 0.876953125, 1.14404296875, 1.4111328125, 1.67822265625, 1.9453125, 2.21240234375, 2.4794921875, 2.74658203125, 3.013671875, 3.28076171875, 3.5478515625, 3.81494140625, 4.08203125, 4.34912109375, 4.6162109375, 4.88330078125, 5.150390625, 5.41748046875, 5.6845703125, 5.95166015625, 6.21875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 7.0, 9.0, 9.0, 11.0, 16.0, 20.0, 29.0, 28.0, 26.0, 32.0, 34.0, 30.0, 36.0, 37.0, 72.0, 85.0, 219.0, 1650.0, 175.0, 69.0, 91.0, 54.0, 51.0, 37.0, 44.0, 20.0, 29.0, 26.0, 11.0, 16.0, 18.0, 13.0, 7.0, 9.0, 4.0, 12.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0], "bins": [-28.046875, -27.31689453125, -26.5869140625, -25.85693359375, -25.126953125, -24.39697265625, -23.6669921875, -22.93701171875, -22.20703125, -21.47705078125, -20.7470703125, -20.01708984375, -19.287109375, -18.55712890625, -17.8271484375, -17.09716796875, -16.3671875, -15.63720703125, -14.9072265625, -14.17724609375, -13.447265625, -12.71728515625, -11.9873046875, -11.25732421875, -10.52734375, -9.79736328125, -9.0673828125, -8.33740234375, -7.607421875, -6.87744140625, -6.1474609375, -5.41748046875, -4.6875, -3.95751953125, -3.2275390625, -2.49755859375, -1.767578125, -1.03759765625, -0.3076171875, 0.42236328125, 1.15234375, 1.88232421875, 2.6123046875, 3.34228515625, 4.072265625, 4.80224609375, 5.5322265625, 6.26220703125, 6.9921875, 7.72216796875, 8.4521484375, 9.18212890625, 9.912109375, 10.64208984375, 11.3720703125, 12.10205078125, 12.83203125, 13.56201171875, 14.2919921875, 15.02197265625, 15.751953125, 16.48193359375, 17.2119140625, 17.94189453125, 18.671875]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 6.0, 7.0, 8.0, 16.0, 27.0, 43.0, 92.0, 124.0, 245.0, 512.0, 2251.0, 3135616.0, 5530.0, 561.0, 289.0, 164.0, 104.0, 40.0, 28.0, 19.0, 9.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-120.4375, -116.6259765625, -112.814453125, -109.0029296875, -105.19140625, -101.3798828125, -97.568359375, -93.7568359375, -89.9453125, -86.1337890625, -82.322265625, -78.5107421875, -74.69921875, -70.8876953125, -67.076171875, -63.2646484375, -59.453125, -55.6416015625, -51.830078125, -48.0185546875, -44.20703125, -40.3955078125, -36.583984375, -32.7724609375, -28.9609375, -25.1494140625, -21.337890625, -17.5263671875, -13.71484375, -9.9033203125, -6.091796875, -2.2802734375, 1.53125, 5.3427734375, 9.154296875, 12.9658203125, 16.77734375, 20.5888671875, 24.400390625, 28.2119140625, 32.0234375, 35.8349609375, 39.646484375, 43.4580078125, 47.26953125, 51.0810546875, 54.892578125, 58.7041015625, 62.515625, 66.3271484375, 70.138671875, 73.9501953125, 77.76171875, 81.5732421875, 85.384765625, 89.1962890625, 93.0078125, 96.8193359375, 100.630859375, 104.4423828125, 108.25390625, 112.0654296875, 115.876953125, 119.6884765625, 123.5]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 48.0, 963.0, 4.0, 2.0, 1.0], "bins": [-784.23779296875, -771.2250366210938, -758.2122802734375, -745.1995239257812, -732.186767578125, -719.1740112304688, -706.1612548828125, -693.1484375, -680.1357421875, -667.1229858398438, -654.1102294921875, -641.0974731445312, -628.084716796875, -615.0719604492188, -602.0592041015625, -589.04638671875, -576.0336303710938, -563.0208740234375, -550.0081176757812, -536.995361328125, -523.9826049804688, -510.9698486328125, -497.9570617675781, -484.9443054199219, -471.9315490722656, -458.9187927246094, -445.9060363769531, -432.8932800292969, -419.8804931640625, -406.86773681640625, -393.85498046875, -380.84222412109375, -367.8294372558594, -354.8166809082031, -341.8039245605469, -328.7911682128906, -315.77838134765625, -302.765625, -289.75286865234375, -276.7401123046875, -263.72735595703125, -250.714599609375, -237.70184326171875, -224.68907165527344, -211.6763153076172, -198.66355895996094, -185.65078735351562, -172.63803100585938, -159.6252899169922, -146.61253356933594, -133.59976196289062, -120.58700561523438, -107.57424926757812, -94.56149291992188, -81.5487289428711, -68.53596496582031, -55.5232048034668, -42.51044464111328, -29.497684478759766, -16.48492431640625, -3.4721641540527344, 9.540592193603516, 22.553356170654297, 35.56612014770508, 48.57887649536133]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 3.0, 5.0, 6.0, 8.0, 13.0, 10.0, 16.0, 14.0, 21.0, 27.0, 20.0, 28.0, 24.0, 26.0, 44.0, 37.0, 35.0, 40.0, 32.0, 44.0, 41.0, 44.0, 46.0, 42.0, 40.0, 38.0, 29.0, 29.0, 36.0, 30.0, 19.0, 19.0, 24.0, 10.0, 17.0, 14.0, 13.0, 15.0, 6.0, 8.0, 4.0, 4.0, 4.0, 3.0, 5.0, 4.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.4766845703125, -52.66476821899414, -50.85285186767578, -49.04093551635742, -47.22901916503906, -45.41710662841797, -43.60519027709961, -41.79327392578125, -39.98135757446289, -38.16944122314453, -36.35752487182617, -34.54560852050781, -32.73369598388672, -30.921777725219727, -29.10986328125, -27.29794692993164, -25.48603057861328, -23.674114227294922, -21.862197875976562, -20.050283432006836, -18.238367080688477, -16.426450729370117, -14.614535331726074, -12.802619934082031, -10.990703582763672, -9.178787231445312, -7.3668718338012695, -5.554955959320068, -3.743040084838867, -1.9311237335205078, -0.11920833587646484, 1.6927070617675781, 3.504627227783203, 5.316543102264404, 7.1284589767456055, 8.940374374389648, 10.752290725708008, 12.564207077026367, 14.37612247467041, 16.188037872314453, 17.999954223632812, 19.811870574951172, 21.62378692626953, 23.435701370239258, 25.247617721557617, 27.059534072875977, 28.871448516845703, 30.683364868164062, 32.49528121948242, 34.30719757080078, 36.11911392211914, 37.9310302734375, 39.742942810058594, 41.55486297607422, 43.36677551269531, 45.17869186401367, 46.99060821533203, 48.80252456665039, 50.61444091796875, 52.42635726928711, 54.23827362060547, 56.05018615722656, 57.86210250854492, 59.67401885986328, 61.48593521118164]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 5.0, 7.0, 7.0, 12.0, 12.0, 10.0, 24.0, 25.0, 20.0, 32.0, 32.0, 35.0, 47.0, 65.0, 55.0, 46.0, 57.0, 46.0, 52.0, 49.0, 43.0, 50.0, 43.0, 40.0, 39.0, 31.0, 26.0, 33.0, 15.0, 9.0, 13.0, 12.0, 7.0, 3.0, 2.0, 5.0, 0.0, 0.0, 1.0, 2.0], "bins": [-11.171875, -10.90118408203125, -10.6304931640625, -10.35980224609375, -10.089111328125, -9.81842041015625, -9.5477294921875, -9.27703857421875, -9.00634765625, -8.73565673828125, -8.4649658203125, -8.19427490234375, -7.923583984375, -7.65289306640625, -7.3822021484375, -7.11151123046875, -6.8408203125, -6.57012939453125, -6.2994384765625, -6.02874755859375, -5.758056640625, -5.48736572265625, -5.2166748046875, -4.94598388671875, -4.67529296875, -4.40460205078125, -4.1339111328125, -3.86322021484375, -3.592529296875, -3.32183837890625, -3.0511474609375, -2.78045654296875, -2.509765625, -2.23907470703125, -1.9683837890625, -1.69769287109375, -1.427001953125, -1.15631103515625, -0.8856201171875, -0.61492919921875, -0.34423828125, -0.07354736328125, 0.1971435546875, 0.46783447265625, 0.738525390625, 1.00921630859375, 1.2799072265625, 1.55059814453125, 1.8212890625, 2.09197998046875, 2.3626708984375, 2.63336181640625, 2.904052734375, 3.17474365234375, 3.4454345703125, 3.71612548828125, 3.98681640625, 4.25750732421875, 4.5281982421875, 4.79888916015625, 5.069580078125, 5.34027099609375, 5.6109619140625, 5.88165283203125, 6.15234375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 2.0, 4.0, 6.0, 9.0, 14.0, 15.0, 18.0, 22.0, 24.0, 26.0, 43.0, 68.0, 97.0, 217.0, 399.0, 1393.0, 12276.0, 747857.0, 3279428.0, 145298.0, 5445.0, 853.0, 310.0, 155.0, 74.0, 51.0, 40.0, 48.0, 20.0, 20.0, 15.0, 12.0, 10.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-28.765625, -28.033935546875, -27.30224609375, -26.570556640625, -25.8388671875, -25.107177734375, -24.37548828125, -23.643798828125, -22.912109375, -22.180419921875, -21.44873046875, -20.717041015625, -19.9853515625, -19.253662109375, -18.52197265625, -17.790283203125, -17.05859375, -16.326904296875, -15.59521484375, -14.863525390625, -14.1318359375, -13.400146484375, -12.66845703125, -11.936767578125, -11.205078125, -10.473388671875, -9.74169921875, -9.010009765625, -8.2783203125, -7.546630859375, -6.81494140625, -6.083251953125, -5.3515625, -4.619873046875, -3.88818359375, -3.156494140625, -2.4248046875, -1.693115234375, -0.96142578125, -0.229736328125, 0.501953125, 1.233642578125, 1.96533203125, 2.697021484375, 3.4287109375, 4.160400390625, 4.89208984375, 5.623779296875, 6.35546875, 7.087158203125, 7.81884765625, 8.550537109375, 9.2822265625, 10.013916015625, 10.74560546875, 11.477294921875, 12.208984375, 12.940673828125, 13.67236328125, 14.404052734375, 15.1357421875, 15.867431640625, 16.59912109375, 17.330810546875, 18.0625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 11.0, 7.0, 18.0, 23.0, 42.0, 59.0, 117.0, 197.0, 250.0, 430.0, 572.0, 743.0, 551.0, 395.0, 236.0, 148.0, 98.0, 59.0, 37.0, 31.0, 23.0, 8.0, 6.0, 9.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.53125, -21.9447021484375, -21.358154296875, -20.7716064453125, -20.18505859375, -19.5985107421875, -19.011962890625, -18.4254150390625, -17.8388671875, -17.2523193359375, -16.665771484375, -16.0792236328125, -15.49267578125, -14.9061279296875, -14.319580078125, -13.7330322265625, -13.146484375, -12.5599365234375, -11.973388671875, -11.3868408203125, -10.80029296875, -10.2137451171875, -9.627197265625, -9.0406494140625, -8.4541015625, -7.8675537109375, -7.281005859375, -6.6944580078125, -6.10791015625, -5.5213623046875, -4.934814453125, -4.3482666015625, -3.76171875, -3.1751708984375, -2.588623046875, -2.0020751953125, -1.41552734375, -0.8289794921875, -0.242431640625, 0.3441162109375, 0.9306640625, 1.5172119140625, 2.103759765625, 2.6903076171875, 3.27685546875, 3.8634033203125, 4.449951171875, 5.0364990234375, 5.623046875, 6.2095947265625, 6.796142578125, 7.3826904296875, 7.96923828125, 8.5557861328125, 9.142333984375, 9.7288818359375, 10.3154296875, 10.9019775390625, 11.488525390625, 12.0750732421875, 12.66162109375, 13.2481689453125, 13.834716796875, 14.4212646484375, 15.0078125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 5.0, 11.0, 15.0, 22.0, 20.0, 27.0, 61.0, 73.0, 91.0, 106.0, 180.0, 230.0, 415.0, 874.0, 9015.0, 4085306.0, 94935.0, 1320.0, 524.0, 311.0, 211.0, 140.0, 111.0, 78.0, 50.0, 32.0, 35.0, 27.0, 11.0, 15.0, 7.0, 9.0, 5.0, 5.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.65625, -53.48876953125, -51.3212890625, -49.15380859375, -46.986328125, -44.81884765625, -42.6513671875, -40.48388671875, -38.31640625, -36.14892578125, -33.9814453125, -31.81396484375, -29.646484375, -27.47900390625, -25.3115234375, -23.14404296875, -20.9765625, -18.80908203125, -16.6416015625, -14.47412109375, -12.306640625, -10.13916015625, -7.9716796875, -5.80419921875, -3.63671875, -1.46923828125, 0.6982421875, 2.86572265625, 5.033203125, 7.20068359375, 9.3681640625, 11.53564453125, 13.703125, 15.87060546875, 18.0380859375, 20.20556640625, 22.373046875, 24.54052734375, 26.7080078125, 28.87548828125, 31.04296875, 33.21044921875, 35.3779296875, 37.54541015625, 39.712890625, 41.88037109375, 44.0478515625, 46.21533203125, 48.3828125, 50.55029296875, 52.7177734375, 54.88525390625, 57.052734375, 59.22021484375, 61.3876953125, 63.55517578125, 65.72265625, 67.89013671875, 70.0576171875, 72.22509765625, 74.392578125, 76.56005859375, 78.7275390625, 80.89501953125, 83.0625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 7.0, 12.0, 10.0, 28.0, 42.0, 51.0, 57.0, 89.0, 112.0, 123.0, 119.0, 98.0, 101.0, 54.0, 39.0, 30.0, 17.0, 12.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.36921691894531, -32.85965347290039, -31.35009002685547, -29.840526580810547, -28.330963134765625, -26.821399688720703, -25.311838150024414, -23.802274703979492, -22.29271125793457, -20.78314781188965, -19.273584365844727, -17.764022827148438, -16.254459381103516, -14.744894981384277, -13.235332489013672, -11.72576904296875, -10.216205596923828, -8.706642150878906, -7.197079181671143, -5.687516212463379, -4.177952766418457, -2.668389320373535, -1.1588268280029297, 0.3507366180419922, 1.860300064086914, 3.369863271713257, 4.8794264793396, 6.388989448547363, 7.898552894592285, 9.408116340637207, 10.917678833007812, 12.427242279052734, 13.936809539794922, 15.446372985839844, 16.955936431884766, 18.465499877929688, 19.97506332397461, 21.48462677001953, 22.99418830871582, 24.503751754760742, 26.013315200805664, 27.522878646850586, 29.032442092895508, 30.542003631591797, 32.05156707763672, 33.56113052368164, 35.07069396972656, 36.580257415771484, 38.089820861816406, 39.59938430786133, 41.10894775390625, 42.61851119995117, 44.128074645996094, 45.637638092041016, 47.14720153808594, 48.656761169433594, 50.16632843017578, 51.6758918762207, 53.185455322265625, 54.69501876831055, 56.20458221435547, 57.71414566040039, 59.22370910644531, 60.73326873779297, 62.24283218383789]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 9.0, 6.0, 12.0, 14.0, 9.0, 14.0, 22.0, 24.0, 27.0, 17.0, 29.0, 27.0, 45.0, 41.0, 33.0, 34.0, 39.0, 43.0, 46.0, 43.0, 52.0, 37.0, 34.0, 41.0, 42.0, 35.0, 24.0, 25.0, 28.0, 19.0, 19.0, 18.0, 16.0, 11.0, 10.0, 13.0, 9.0, 10.0, 4.0, 9.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-47.97943115234375, -46.67707443237305, -45.374717712402344, -44.072364807128906, -42.7700080871582, -41.4676513671875, -40.1652946472168, -38.862937927246094, -37.560585021972656, -36.25822830200195, -34.95587158203125, -33.65351867675781, -32.35116195678711, -31.048805236816406, -29.746448516845703, -28.444093704223633, -27.14173698425293, -25.839380264282227, -24.537025451660156, -23.234668731689453, -21.932313919067383, -20.62995719909668, -19.32760238647461, -18.025245666503906, -16.722888946533203, -15.420533180236816, -14.11817741394043, -12.815820693969727, -11.513465881347656, -10.211109161376953, -8.908753395080566, -7.60639762878418, -6.304042816162109, -5.001687049865723, -3.699331045150757, -2.396975040435791, -1.0946192741394043, 0.20773649215698242, 1.5100927352905273, 2.812448501586914, 4.114804267883301, 5.4171600341796875, 6.719515800476074, 8.021871566772461, 9.324228286743164, 10.626583099365234, 11.928939819335938, 13.231295585632324, 14.533651351928711, 15.836007118225098, 17.138362884521484, 18.440719604492188, 19.743074417114258, 21.04543113708496, 22.34778594970703, 23.650142669677734, 24.952499389648438, 26.25485610961914, 27.55721092224121, 28.859567642211914, 30.161922454833984, 31.464279174804688, 32.76663589477539, 34.068992614746094, 35.37134552001953]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 0.0, 7.0, 5.0, 9.0, 5.0, 10.0, 21.0, 11.0, 25.0, 20.0, 14.0, 34.0, 36.0, 50.0, 43.0, 64.0, 47.0, 39.0, 44.0, 61.0, 52.0, 56.0, 40.0, 48.0, 38.0, 41.0, 39.0, 23.0, 24.0, 22.0, 30.0, 18.0, 11.0, 8.0, 1.0, 6.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.8515625, -9.59954833984375, -9.3475341796875, -9.09552001953125, -8.843505859375, -8.59149169921875, -8.3394775390625, -8.08746337890625, -7.83544921875, -7.58343505859375, -7.3314208984375, -7.07940673828125, -6.827392578125, -6.57537841796875, -6.3233642578125, -6.07135009765625, -5.8193359375, -5.56732177734375, -5.3153076171875, -5.06329345703125, -4.811279296875, -4.55926513671875, -4.3072509765625, -4.05523681640625, -3.80322265625, -3.55120849609375, -3.2991943359375, -3.04718017578125, -2.795166015625, -2.54315185546875, -2.2911376953125, -2.03912353515625, -1.787109375, -1.53509521484375, -1.2830810546875, -1.03106689453125, -0.779052734375, -0.52703857421875, -0.2750244140625, -0.02301025390625, 0.22900390625, 0.48101806640625, 0.7330322265625, 0.98504638671875, 1.237060546875, 1.48907470703125, 1.7410888671875, 1.99310302734375, 2.2451171875, 2.49713134765625, 2.7491455078125, 3.00115966796875, 3.253173828125, 3.50518798828125, 3.7572021484375, 4.00921630859375, 4.26123046875, 4.51324462890625, 4.7652587890625, 5.01727294921875, 5.269287109375, 5.52130126953125, 5.7733154296875, 6.02532958984375, 6.27734375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 9.0, 6.0, 10.0, 8.0, 20.0, 34.0, 41.0, 65.0, 92.0, 178.0, 276.0, 459.0, 915.0, 1487.0, 2733.0, 4900.0, 9130.0, 16919.0, 33192.0, 67021.0, 152260.0, 398583.0, 196503.0, 80644.0, 39106.0, 19959.0, 10967.0, 5824.0, 3110.0, 1759.0, 1003.0, 554.0, 316.0, 163.0, 120.0, 70.0, 39.0, 26.0, 17.0, 11.0, 10.0, 10.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8935546875, -1.83367919921875, -1.7738037109375, -1.71392822265625, -1.654052734375, -1.59417724609375, -1.5343017578125, -1.47442626953125, -1.41455078125, -1.35467529296875, -1.2947998046875, -1.23492431640625, -1.175048828125, -1.11517333984375, -1.0552978515625, -0.99542236328125, -0.935546875, -0.87567138671875, -0.8157958984375, -0.75592041015625, -0.696044921875, -0.63616943359375, -0.5762939453125, -0.51641845703125, -0.45654296875, -0.39666748046875, -0.3367919921875, -0.27691650390625, -0.217041015625, -0.15716552734375, -0.0972900390625, -0.03741455078125, 0.0224609375, 0.08233642578125, 0.1422119140625, 0.20208740234375, 0.261962890625, 0.32183837890625, 0.3817138671875, 0.44158935546875, 0.50146484375, 0.56134033203125, 0.6212158203125, 0.68109130859375, 0.740966796875, 0.80084228515625, 0.8607177734375, 0.92059326171875, 0.98046875, 1.04034423828125, 1.1002197265625, 1.16009521484375, 1.219970703125, 1.27984619140625, 1.3397216796875, 1.39959716796875, 1.45947265625, 1.51934814453125, 1.5792236328125, 1.63909912109375, 1.698974609375, 1.75885009765625, 1.8187255859375, 1.87860107421875, 1.9384765625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 5.0, 11.0, 10.0, 9.0, 20.0, 11.0, 14.0, 15.0, 23.0, 25.0, 28.0, 23.0, 29.0, 38.0, 47.0, 29.0, 35.0, 39.0, 29.0, 1059.0, 47.0, 47.0, 53.0, 44.0, 34.0, 37.0, 33.0, 24.0, 37.0, 26.0, 16.0, 25.0, 15.0, 5.0, 12.0, 11.0, 11.0, 8.0, 7.0, 6.0, 4.0, 6.0, 5.0, 1.0, 6.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.5078125, -4.376922607421875, -4.24603271484375, -4.115142822265625, -3.9842529296875, -3.853363037109375, -3.72247314453125, -3.591583251953125, -3.460693359375, -3.329803466796875, -3.19891357421875, -3.068023681640625, -2.9371337890625, -2.806243896484375, -2.67535400390625, -2.544464111328125, -2.41357421875, -2.282684326171875, -2.15179443359375, -2.020904541015625, -1.8900146484375, -1.759124755859375, -1.62823486328125, -1.497344970703125, -1.366455078125, -1.235565185546875, -1.10467529296875, -0.973785400390625, -0.8428955078125, -0.712005615234375, -0.58111572265625, -0.450225830078125, -0.3193359375, -0.188446044921875, -0.05755615234375, 0.073333740234375, 0.2042236328125, 0.335113525390625, 0.46600341796875, 0.596893310546875, 0.727783203125, 0.858673095703125, 0.98956298828125, 1.120452880859375, 1.2513427734375, 1.382232666015625, 1.51312255859375, 1.644012451171875, 1.77490234375, 1.905792236328125, 2.03668212890625, 2.167572021484375, 2.2984619140625, 2.429351806640625, 2.56024169921875, 2.691131591796875, 2.822021484375, 2.952911376953125, 3.08380126953125, 3.214691162109375, 3.3455810546875, 3.476470947265625, 3.60736083984375, 3.738250732421875, 3.869140625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 4.0, 10.0, 5.0, 5.0, 11.0, 16.0, 14.0, 32.0, 37.0, 70.0, 122.0, 219.0, 397.0, 709.0, 1263.0, 2329.0, 4198.0, 7749.0, 14932.0, 29414.0, 61291.0, 150198.0, 1491478.0, 189269.0, 72888.0, 33694.0, 17159.0, 9031.0, 4655.0, 2622.0, 1476.0, 755.0, 472.0, 252.0, 140.0, 66.0, 45.0, 37.0, 19.0, 14.0, 10.0, 8.0, 6.0, 2.0, 0.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.892578125, -1.828643798828125, -1.76470947265625, -1.700775146484375, -1.6368408203125, -1.572906494140625, -1.50897216796875, -1.445037841796875, -1.381103515625, -1.317169189453125, -1.25323486328125, -1.189300537109375, -1.1253662109375, -1.061431884765625, -0.99749755859375, -0.933563232421875, -0.86962890625, -0.805694580078125, -0.74176025390625, -0.677825927734375, -0.6138916015625, -0.549957275390625, -0.48602294921875, -0.422088623046875, -0.358154296875, -0.294219970703125, -0.23028564453125, -0.166351318359375, -0.1024169921875, -0.038482666015625, 0.02545166015625, 0.089385986328125, 0.1533203125, 0.217254638671875, 0.28118896484375, 0.345123291015625, 0.4090576171875, 0.472991943359375, 0.53692626953125, 0.600860595703125, 0.664794921875, 0.728729248046875, 0.79266357421875, 0.856597900390625, 0.9205322265625, 0.984466552734375, 1.04840087890625, 1.112335205078125, 1.17626953125, 1.240203857421875, 1.30413818359375, 1.368072509765625, 1.4320068359375, 1.495941162109375, 1.55987548828125, 1.623809814453125, 1.687744140625, 1.751678466796875, 1.81561279296875, 1.879547119140625, 1.9434814453125, 2.007415771484375, 2.07135009765625, 2.135284423828125, 2.19921875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 5.0, 6.0, 5.0, 8.0, 12.0, 21.0, 19.0, 28.0, 36.0, 31.0, 38.0, 59.0, 75.0, 82.0, 104.0, 90.0, 74.0, 49.0, 51.0, 34.0, 35.0, 31.0, 24.0, 18.0, 9.0, 12.0, 10.0, 4.0, 6.0, 5.0, 6.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0011358261108398438, -0.0011020451784133911, -0.0010682642459869385, -0.0010344833135604858, -0.0010007023811340332, -0.0009669214487075806, -0.0009331405162811279, -0.0008993595838546753, -0.0008655786514282227, -0.00083179771900177, -0.0007980167865753174, -0.0007642358541488647, -0.0007304549217224121, -0.0006966739892959595, -0.0006628930568695068, -0.0006291121244430542, -0.0005953311920166016, -0.0005615502595901489, -0.0005277693271636963, -0.0004939883947372437, -0.000460207462310791, -0.0004264265298843384, -0.00039264559745788574, -0.0003588646650314331, -0.00032508373260498047, -0.00029130280017852783, -0.0002575218677520752, -0.00022374093532562256, -0.00018996000289916992, -0.00015617907047271729, -0.00012239813804626465, -8.861720561981201e-05, -5.4836273193359375e-05, -2.1055340766906738e-05, 1.2725591659545898e-05, 4.6506524085998535e-05, 8.028745651245117e-05, 0.00011406838893890381, 0.00014784932136535645, 0.00018163025379180908, 0.00021541118621826172, 0.00024919211864471436, 0.000282973051071167, 0.00031675398349761963, 0.00035053491592407227, 0.0003843158483505249, 0.00041809678077697754, 0.0004518777132034302, 0.0004856586456298828, 0.0005194395780563354, 0.0005532205104827881, 0.0005870014429092407, 0.0006207823753356934, 0.000654563307762146, 0.0006883442401885986, 0.0007221251726150513, 0.0007559061050415039, 0.0007896870374679565, 0.0008234679698944092, 0.0008572489023208618, 0.0008910298347473145, 0.0009248107671737671, 0.0009585916996002197, 0.0009923726320266724, 0.001026153564453125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 6.0, 4.0, 6.0, 12.0, 9.0, 7.0, 15.0, 17.0, 37.0, 29.0, 56.0, 55.0, 85.0, 157.0, 370.0, 1765.0, 1033900.0, 10875.0, 539.0, 244.0, 107.0, 58.0, 45.0, 35.0, 36.0, 28.0, 12.0, 9.0, 11.0, 10.0, 3.0, 3.0, 2.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02423095703125, -0.02341461181640625, -0.0225982666015625, -0.02178192138671875, -0.020965576171875, -0.02014923095703125, -0.0193328857421875, -0.01851654052734375, -0.0177001953125, -0.01688385009765625, -0.0160675048828125, -0.01525115966796875, -0.014434814453125, -0.01361846923828125, -0.0128021240234375, -0.01198577880859375, -0.01116943359375, -0.01035308837890625, -0.0095367431640625, -0.00872039794921875, -0.007904052734375, -0.00708770751953125, -0.0062713623046875, -0.00545501708984375, -0.004638671875, -0.00382232666015625, -0.0030059814453125, -0.00218963623046875, -0.001373291015625, -0.00055694580078125, 0.0002593994140625, 0.00107574462890625, 0.00189208984375, 0.00270843505859375, 0.0035247802734375, 0.00434112548828125, 0.005157470703125, 0.00597381591796875, 0.0067901611328125, 0.00760650634765625, 0.0084228515625, 0.00923919677734375, 0.0100555419921875, 0.01087188720703125, 0.011688232421875, 0.01250457763671875, 0.0133209228515625, 0.01413726806640625, 0.01495361328125, 0.01576995849609375, 0.0165863037109375, 0.01740264892578125, 0.018218994140625, 0.01903533935546875, 0.0198516845703125, 0.02066802978515625, 0.021484375, 0.02230072021484375, 0.0231170654296875, 0.02393341064453125, 0.024749755859375, 0.02556610107421875, 0.0263824462890625, 0.02719879150390625, 0.02801513671875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 13.0, 21.0, 62.0, 100.0, 158.0, 210.0, 194.0, 122.0, 65.0, 40.0, 18.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007253868388943374, -0.0006991919362917542, -0.0006729970336891711, -0.0006468021310865879, -0.0006206072284840047, -0.0005944123258814216, -0.0005682174232788384, -0.0005420225206762552, -0.0005158276180736721, -0.0004896327154710889, -0.0004634378128685057, -0.00043724291026592255, -0.0004110480076633394, -0.0003848531050607562, -0.00035865820245817304, -0.00033246329985558987, -0.0003062683972530067, -0.0002800734946504235, -0.00025387859204784036, -0.0002276836894452572, -0.00020148878684267402, -0.00017529388424009085, -0.00014909898163750768, -0.0001229040790349245, -9.670917643234134e-05, -7.051427382975817e-05, -4.4319371227175e-05, -1.8124468624591827e-05, 8.070433977991343e-06, 3.426533658057451e-05, 6.046023918315768e-05, 8.665514178574085e-05, 0.00011285010259598494, 0.0001390450051985681, 0.00016523990780115128, 0.00019143481040373445, 0.00021762971300631762, 0.00024382461560890079, 0.00027001951821148396, 0.0002962144208140671, 0.0003224093234166503, 0.00034860422601923347, 0.00037479912862181664, 0.0004009940312243998, 0.000427188933826983, 0.00045338383642956614, 0.0004795787390321493, 0.0005057736416347325, 0.0005319685442373157, 0.0005581634468398988, 0.000584358349442482, 0.0006105532520450652, 0.0006367481546476483, 0.0006629430572502315, 0.0006891379598528147, 0.0007153328624553978, 0.000741527765057981, 0.0007677226676605642, 0.0007939175702631474, 0.0008201124728657305, 0.0008463073754683137, 0.0008725022780708969, 0.00089869718067348, 0.0009248920832760632, 0.0009510869858786464]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 4.0, 6.0, 10.0, 12.0, 10.0, 13.0, 19.0, 11.0, 19.0, 9.0, 20.0, 33.0, 32.0, 19.0, 38.0, 31.0, 25.0, 33.0, 39.0, 48.0, 49.0, 55.0, 49.0, 53.0, 33.0, 34.0, 31.0, 31.0, 25.0, 27.0, 22.0, 25.0, 23.0, 17.0, 9.0, 18.0, 10.0, 18.0, 14.0, 10.0, 3.0, 7.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004163384437561035, -0.00040195975452661514, -0.00038758106529712677, -0.0003732023760676384, -0.00035882368683815, -0.00034444499760866165, -0.0003300663083791733, -0.0003156876191496849, -0.00030130892992019653, -0.00028693024069070816, -0.0002725515514612198, -0.0002581728622317314, -0.00024379417300224304, -0.00022941548377275467, -0.0002150367945432663, -0.00020065810531377792, -0.00018627941608428955, -0.00017190072685480118, -0.0001575220376253128, -0.00014314334839582443, -0.00012876465916633606, -0.00011438596993684769, -0.00010000728070735931, -8.562859147787094e-05, -7.124990224838257e-05, -5.6871213018894196e-05, -4.249252378940582e-05, -2.811383455991745e-05, -1.3735145330429077e-05, 6.435438990592957e-07, 1.5022233128547668e-05, 2.940092235803604e-05, 4.3779611587524414e-05, 5.815830081701279e-05, 7.253699004650116e-05, 8.691567927598953e-05, 0.0001012943685054779, 0.00011567305773496628, 0.00013005174696445465, 0.00014443043619394302, 0.0001588091254234314, 0.00017318781465291977, 0.00018756650388240814, 0.00020194519311189651, 0.0002163238823413849, 0.00023070257157087326, 0.00024508126080036163, 0.00025945995002985, 0.0002738386392593384, 0.00028821732848882675, 0.0003025960177183151, 0.0003169747069478035, 0.00033135339617729187, 0.00034573208540678024, 0.0003601107746362686, 0.000374489463865757, 0.00038886815309524536, 0.00040324684232473373, 0.0004176255315542221, 0.0004320042207837105, 0.00044638291001319885, 0.0004607615992426872, 0.0004751402884721756, 0.000489518977701664, 0.0005038976669311523]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 0.0, 7.0, 5.0, 9.0, 5.0, 10.0, 21.0, 11.0, 25.0, 20.0, 14.0, 34.0, 36.0, 50.0, 43.0, 64.0, 47.0, 39.0, 44.0, 61.0, 52.0, 56.0, 40.0, 48.0, 38.0, 41.0, 39.0, 23.0, 24.0, 22.0, 30.0, 18.0, 11.0, 8.0, 1.0, 6.0, 2.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.8515625, -9.59954833984375, -9.3475341796875, -9.09552001953125, -8.843505859375, -8.59149169921875, -8.3394775390625, -8.08746337890625, -7.83544921875, -7.58343505859375, -7.3314208984375, -7.07940673828125, -6.827392578125, -6.57537841796875, -6.3233642578125, -6.07135009765625, -5.8193359375, -5.56732177734375, -5.3153076171875, -5.06329345703125, -4.811279296875, -4.55926513671875, -4.3072509765625, -4.05523681640625, -3.80322265625, -3.55120849609375, -3.2991943359375, -3.04718017578125, -2.795166015625, -2.54315185546875, -2.2911376953125, -2.03912353515625, -1.787109375, -1.53509521484375, -1.2830810546875, -1.03106689453125, -0.779052734375, -0.52703857421875, -0.2750244140625, -0.02301025390625, 0.22900390625, 0.48101806640625, 0.7330322265625, 0.98504638671875, 1.237060546875, 1.48907470703125, 1.7410888671875, 1.99310302734375, 2.2451171875, 2.49713134765625, 2.7491455078125, 3.00115966796875, 3.253173828125, 3.50518798828125, 3.7572021484375, 4.00921630859375, 4.26123046875, 4.51324462890625, 4.7652587890625, 5.01727294921875, 5.269287109375, 5.52130126953125, 5.7733154296875, 6.02532958984375, 6.27734375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 5.0, 2.0, 6.0, 6.0, 9.0, 11.0, 15.0, 25.0, 35.0, 52.0, 87.0, 127.0, 212.0, 386.0, 777.0, 1771.0, 4738.0, 17530.0, 87756.0, 582661.0, 289536.0, 46290.0, 10650.0, 3193.0, 1203.0, 582.0, 339.0, 215.0, 111.0, 74.0, 44.0, 46.0, 22.0, 18.0, 6.0, 5.0, 4.0, 6.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.609375, -9.36181640625, -9.1142578125, -8.86669921875, -8.619140625, -8.37158203125, -8.1240234375, -7.87646484375, -7.62890625, -7.38134765625, -7.1337890625, -6.88623046875, -6.638671875, -6.39111328125, -6.1435546875, -5.89599609375, -5.6484375, -5.40087890625, -5.1533203125, -4.90576171875, -4.658203125, -4.41064453125, -4.1630859375, -3.91552734375, -3.66796875, -3.42041015625, -3.1728515625, -2.92529296875, -2.677734375, -2.43017578125, -2.1826171875, -1.93505859375, -1.6875, -1.43994140625, -1.1923828125, -0.94482421875, -0.697265625, -0.44970703125, -0.2021484375, 0.04541015625, 0.29296875, 0.54052734375, 0.7880859375, 1.03564453125, 1.283203125, 1.53076171875, 1.7783203125, 2.02587890625, 2.2734375, 2.52099609375, 2.7685546875, 3.01611328125, 3.263671875, 3.51123046875, 3.7587890625, 4.00634765625, 4.25390625, 4.50146484375, 4.7490234375, 4.99658203125, 5.244140625, 5.49169921875, 5.7392578125, 5.98681640625, 6.234375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 0.0, 2.0, 5.0, 6.0, 3.0, 8.0, 11.0, 14.0, 10.0, 20.0, 20.0, 21.0, 23.0, 25.0, 25.0, 27.0, 33.0, 28.0, 56.0, 45.0, 57.0, 87.0, 335.0, 1597.0, 139.0, 55.0, 44.0, 44.0, 31.0, 40.0, 34.0, 32.0, 26.0, 15.0, 23.0, 19.0, 13.0, 20.0, 9.0, 14.0, 5.0, 10.0, 5.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.28125, -20.619384765625, -19.95751953125, -19.295654296875, -18.6337890625, -17.971923828125, -17.31005859375, -16.648193359375, -15.986328125, -15.324462890625, -14.66259765625, -14.000732421875, -13.3388671875, -12.677001953125, -12.01513671875, -11.353271484375, -10.69140625, -10.029541015625, -9.36767578125, -8.705810546875, -8.0439453125, -7.382080078125, -6.72021484375, -6.058349609375, -5.396484375, -4.734619140625, -4.07275390625, -3.410888671875, -2.7490234375, -2.087158203125, -1.42529296875, -0.763427734375, -0.1015625, 0.560302734375, 1.22216796875, 1.884033203125, 2.5458984375, 3.207763671875, 3.86962890625, 4.531494140625, 5.193359375, 5.855224609375, 6.51708984375, 7.178955078125, 7.8408203125, 8.502685546875, 9.16455078125, 9.826416015625, 10.48828125, 11.150146484375, 11.81201171875, 12.473876953125, 13.1357421875, 13.797607421875, 14.45947265625, 15.121337890625, 15.783203125, 16.445068359375, 17.10693359375, 17.768798828125, 18.4306640625, 19.092529296875, 19.75439453125, 20.416259765625, 21.078125]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 12.0, 20.0, 37.0, 53.0, 89.0, 233.0, 501.0, 3016.0, 3138263.0, 2521.0, 515.0, 202.0, 97.0, 64.0, 26.0, 23.0, 10.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.3125, -121.0615234375, -116.810546875, -112.5595703125, -108.30859375, -104.0576171875, -99.806640625, -95.5556640625, -91.3046875, -87.0537109375, -82.802734375, -78.5517578125, -74.30078125, -70.0498046875, -65.798828125, -61.5478515625, -57.296875, -53.0458984375, -48.794921875, -44.5439453125, -40.29296875, -36.0419921875, -31.791015625, -27.5400390625, -23.2890625, -19.0380859375, -14.787109375, -10.5361328125, -6.28515625, -2.0341796875, 2.216796875, 6.4677734375, 10.71875, 14.9697265625, 19.220703125, 23.4716796875, 27.72265625, 31.9736328125, 36.224609375, 40.4755859375, 44.7265625, 48.9775390625, 53.228515625, 57.4794921875, 61.73046875, 65.9814453125, 70.232421875, 74.4833984375, 78.734375, 82.9853515625, 87.236328125, 91.4873046875, 95.73828125, 99.9892578125, 104.240234375, 108.4912109375, 112.7421875, 116.9931640625, 121.244140625, 125.4951171875, 129.74609375, 133.9970703125, 138.248046875, 142.4990234375, 146.75]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 9.0, 89.0, 398.0, 417.0, 95.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.34880065917969, -31.117483139038086, -28.886165618896484, -26.65484619140625, -24.42352867126465, -22.192211151123047, -19.960891723632812, -17.72957420349121, -15.49825668334961, -13.266939163208008, -11.03562068939209, -8.804302215576172, -6.57298469543457, -4.341667175292969, -2.110348701477051, 0.12096977233886719, 2.3522872924804688, 4.5836052894592285, 6.814923286437988, 9.046241760253906, 11.277559280395508, 13.50887680053711, 15.740195274353027, 17.971513748168945, 20.202831268310547, 22.43414878845215, 24.66546630859375, 26.896785736083984, 29.128103256225586, 31.359420776367188, 33.59074020385742, 35.822059631347656, 38.053382873535156, 40.28470230102539, 42.51601791381836, 44.747337341308594, 46.97865295410156, 49.2099723815918, 51.44129180908203, 53.672607421875, 55.903926849365234, 58.13524627685547, 60.36656188964844, 62.59788131713867, 64.8292007446289, 67.06051635742188, 69.29183197021484, 71.52315521240234, 73.75447082519531, 75.98578643798828, 78.21710968017578, 80.44842529296875, 82.67974090576172, 84.91105651855469, 87.14237976074219, 89.37369537353516, 91.60501098632812, 93.8363265991211, 96.0676498413086, 98.29896545410156, 100.53028106689453, 102.7615966796875, 104.992919921875, 107.22423553466797, 109.45555877685547]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 6.0, 2.0, 11.0, 12.0, 9.0, 19.0, 23.0, 23.0, 24.0, 39.0, 41.0, 36.0, 32.0, 41.0, 50.0, 43.0, 48.0, 51.0, 45.0, 46.0, 46.0, 36.0, 42.0, 33.0, 38.0, 28.0, 32.0, 25.0, 21.0, 26.0, 14.0, 10.0, 8.0, 8.0, 10.0, 6.0, 4.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-65.46469116210938, -63.58001708984375, -61.69533920288086, -59.81066131591797, -57.925987243652344, -56.04131317138672, -54.15663528442383, -52.27195739746094, -50.38728332519531, -48.50260925292969, -46.6179313659668, -44.733253479003906, -42.84857940673828, -40.963905334472656, -39.079227447509766, -37.194549560546875, -35.30987548828125, -33.425201416015625, -31.540523529052734, -29.655847549438477, -27.77117156982422, -25.88649559020996, -24.001819610595703, -22.117143630981445, -20.232467651367188, -18.34779167175293, -16.463115692138672, -14.578439712524414, -12.693763732910156, -10.809087753295898, -8.92441177368164, -7.039735794067383, -5.155059814453125, -3.270383834838867, -1.3857078552246094, 0.49896812438964844, 2.3836441040039062, 4.268320083618164, 6.152996063232422, 8.03767204284668, 9.922348022460938, 11.807024002075195, 13.691699981689453, 15.576375961303711, 17.46105194091797, 19.345727920532227, 21.230403900146484, 23.115079879760742, 24.999755859375, 26.884431838989258, 28.769107818603516, 30.653783798217773, 32.53845977783203, 34.423133850097656, 36.30781173706055, 38.19248962402344, 40.07716369628906, 41.96183776855469, 43.84651565551758, 45.73119354248047, 47.615867614746094, 49.50054168701172, 51.38521957397461, 53.2698974609375, 55.154571533203125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 2.0, 3.0, 7.0, 12.0, 15.0, 15.0, 17.0, 23.0, 14.0, 22.0, 35.0, 26.0, 42.0, 48.0, 58.0, 46.0, 49.0, 44.0, 54.0, 42.0, 51.0, 46.0, 46.0, 41.0, 39.0, 35.0, 33.0, 21.0, 23.0, 29.0, 24.0, 14.0, 9.0, 6.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.609375, -9.35845947265625, -9.1075439453125, -8.85662841796875, -8.605712890625, -8.35479736328125, -8.1038818359375, -7.85296630859375, -7.60205078125, -7.35113525390625, -7.1002197265625, -6.84930419921875, -6.598388671875, -6.34747314453125, -6.0965576171875, -5.84564208984375, -5.5947265625, -5.34381103515625, -5.0928955078125, -4.84197998046875, -4.591064453125, -4.34014892578125, -4.0892333984375, -3.83831787109375, -3.58740234375, -3.33648681640625, -3.0855712890625, -2.83465576171875, -2.583740234375, -2.33282470703125, -2.0819091796875, -1.83099365234375, -1.580078125, -1.32916259765625, -1.0782470703125, -0.82733154296875, -0.576416015625, -0.32550048828125, -0.0745849609375, 0.17633056640625, 0.42724609375, 0.67816162109375, 0.9290771484375, 1.17999267578125, 1.430908203125, 1.68182373046875, 1.9327392578125, 2.18365478515625, 2.4345703125, 2.68548583984375, 2.9364013671875, 3.18731689453125, 3.438232421875, 3.68914794921875, 3.9400634765625, 4.19097900390625, 4.44189453125, 4.69281005859375, 4.9437255859375, 5.19464111328125, 5.445556640625, 5.69647216796875, 5.9473876953125, 6.19830322265625, 6.44921875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 5.0, 6.0, 7.0, 14.0, 17.0, 17.0, 29.0, 31.0, 34.0, 40.0, 48.0, 70.0, 100.0, 95.0, 154.0, 277.0, 506.0, 1512.0, 8292.0, 135607.0, 2432619.0, 1545250.0, 61809.0, 5276.0, 1103.0, 435.0, 248.0, 149.0, 120.0, 89.0, 61.0, 56.0, 49.0, 38.0, 31.0, 22.0, 17.0, 7.0, 12.0, 7.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.078125, -19.50244140625, -18.9267578125, -18.35107421875, -17.775390625, -17.19970703125, -16.6240234375, -16.04833984375, -15.47265625, -14.89697265625, -14.3212890625, -13.74560546875, -13.169921875, -12.59423828125, -12.0185546875, -11.44287109375, -10.8671875, -10.29150390625, -9.7158203125, -9.14013671875, -8.564453125, -7.98876953125, -7.4130859375, -6.83740234375, -6.26171875, -5.68603515625, -5.1103515625, -4.53466796875, -3.958984375, -3.38330078125, -2.8076171875, -2.23193359375, -1.65625, -1.08056640625, -0.5048828125, 0.07080078125, 0.646484375, 1.22216796875, 1.7978515625, 2.37353515625, 2.94921875, 3.52490234375, 4.1005859375, 4.67626953125, 5.251953125, 5.82763671875, 6.4033203125, 6.97900390625, 7.5546875, 8.13037109375, 8.7060546875, 9.28173828125, 9.857421875, 10.43310546875, 11.0087890625, 11.58447265625, 12.16015625, 12.73583984375, 13.3115234375, 13.88720703125, 14.462890625, 15.03857421875, 15.6142578125, 16.18994140625, 16.765625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 6.0, 9.0, 12.0, 30.0, 27.0, 46.0, 54.0, 91.0, 122.0, 181.0, 270.0, 397.0, 505.0, 586.0, 516.0, 383.0, 265.0, 185.0, 123.0, 89.0, 60.0, 23.0, 26.0, 19.0, 9.0, 11.0, 10.0, 2.0, 7.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7734375, -15.286376953125, -14.79931640625, -14.312255859375, -13.8251953125, -13.338134765625, -12.85107421875, -12.364013671875, -11.876953125, -11.389892578125, -10.90283203125, -10.415771484375, -9.9287109375, -9.441650390625, -8.95458984375, -8.467529296875, -7.98046875, -7.493408203125, -7.00634765625, -6.519287109375, -6.0322265625, -5.545166015625, -5.05810546875, -4.571044921875, -4.083984375, -3.596923828125, -3.10986328125, -2.622802734375, -2.1357421875, -1.648681640625, -1.16162109375, -0.674560546875, -0.1875, 0.299560546875, 0.78662109375, 1.273681640625, 1.7607421875, 2.247802734375, 2.73486328125, 3.221923828125, 3.708984375, 4.196044921875, 4.68310546875, 5.170166015625, 5.6572265625, 6.144287109375, 6.63134765625, 7.118408203125, 7.60546875, 8.092529296875, 8.57958984375, 9.066650390625, 9.5537109375, 10.040771484375, 10.52783203125, 11.014892578125, 11.501953125, 11.989013671875, 12.47607421875, 12.963134765625, 13.4501953125, 13.937255859375, 14.42431640625, 14.911376953125, 15.3984375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 6.0, 7.0, 11.0, 15.0, 27.0, 35.0, 48.0, 56.0, 90.0, 148.0, 195.0, 252.0, 402.0, 825.0, 12795.0, 4155086.0, 22119.0, 801.0, 421.0, 288.0, 162.0, 123.0, 111.0, 73.0, 52.0, 40.0, 30.0, 22.0, 11.0, 6.0, 11.0, 6.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.9375, -73.451171875, -70.96484375, -68.478515625, -65.9921875, -63.505859375, -61.01953125, -58.533203125, -56.046875, -53.560546875, -51.07421875, -48.587890625, -46.1015625, -43.615234375, -41.12890625, -38.642578125, -36.15625, -33.669921875, -31.18359375, -28.697265625, -26.2109375, -23.724609375, -21.23828125, -18.751953125, -16.265625, -13.779296875, -11.29296875, -8.806640625, -6.3203125, -3.833984375, -1.34765625, 1.138671875, 3.625, 6.111328125, 8.59765625, 11.083984375, 13.5703125, 16.056640625, 18.54296875, 21.029296875, 23.515625, 26.001953125, 28.48828125, 30.974609375, 33.4609375, 35.947265625, 38.43359375, 40.919921875, 43.40625, 45.892578125, 48.37890625, 50.865234375, 53.3515625, 55.837890625, 58.32421875, 60.810546875, 63.296875, 65.783203125, 68.26953125, 70.755859375, 73.2421875, 75.728515625, 78.21484375, 80.701171875, 83.1875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 10.0, 103.0, 417.0, 383.0, 92.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-276.5157165527344, -269.75860595703125, -263.0014953613281, -256.2444152832031, -249.4873046875, -242.73019409179688, -235.97308349609375, -229.2159881591797, -222.45889282226562, -215.7017822265625, -208.94468688964844, -202.1875762939453, -195.43048095703125, -188.67337036132812, -181.916259765625, -175.15916442871094, -168.4020538330078, -161.6449432373047, -154.88784790039062, -148.1307373046875, -141.37364196777344, -134.6165313720703, -127.85942840576172, -121.10232543945312, -114.34522247314453, -107.58811950683594, -100.83101654052734, -94.07391357421875, -87.31680297851562, -80.55970764160156, -73.80259704589844, -67.04549407958984, -60.28837585449219, -53.531272888183594, -46.774169921875, -40.01706314086914, -33.25996017456055, -26.502857208251953, -19.745750427246094, -12.9886474609375, -6.231544494628906, 0.5255594253540039, 7.282663345336914, 14.03976821899414, 20.796871185302734, 27.553974151611328, 34.31108093261719, 41.06818389892578, 47.825286865234375, 54.58238983154297, 61.33949279785156, 68.09660339355469, 74.85369873046875, 81.61080932617188, 88.36791229248047, 95.12501525878906, 101.88211822509766, 108.63922119140625, 115.39632415771484, 122.15342712402344, 128.91053771972656, 135.66763305664062, 142.42474365234375, 149.18185424804688, 155.93894958496094]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 3.0, 5.0, 10.0, 3.0, 7.0, 11.0, 11.0, 16.0, 15.0, 25.0, 14.0, 23.0, 33.0, 28.0, 26.0, 45.0, 33.0, 46.0, 38.0, 39.0, 54.0, 53.0, 42.0, 46.0, 36.0, 52.0, 29.0, 34.0, 33.0, 30.0, 23.0, 22.0, 28.0, 20.0, 18.0, 11.0, 4.0, 9.0, 9.0, 5.0, 4.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-52.642974853515625, -51.22309112548828, -49.80320358276367, -48.38331604003906, -46.96343231201172, -45.543548583984375, -44.123661041259766, -42.703773498535156, -41.28388977050781, -39.86400604248047, -38.44411849975586, -37.02423095703125, -35.604347229003906, -34.18446350097656, -32.76457595825195, -31.344690322875977, -29.9248046875, -28.504919052124023, -27.085033416748047, -25.66514778137207, -24.245262145996094, -22.825376510620117, -21.40549087524414, -19.985605239868164, -18.565719604492188, -17.14583396911621, -15.725948333740234, -14.306062698364258, -12.886177062988281, -11.466291427612305, -10.046405792236328, -8.626520156860352, -7.206634521484375, -5.786748886108398, -4.366863250732422, -2.9469776153564453, -1.5270919799804688, -0.10720634460449219, 1.3126792907714844, 2.732564926147461, 4.1524505615234375, 5.572336196899414, 6.992221832275391, 8.412107467651367, 9.831993103027344, 11.25187873840332, 12.671764373779297, 14.091650009155273, 15.51153564453125, 16.931421279907227, 18.351306915283203, 19.77119255065918, 21.191078186035156, 22.610963821411133, 24.03084945678711, 25.450735092163086, 26.870620727539062, 28.29050636291504, 29.710391998291016, 31.130277633666992, 32.55016326904297, 33.97004699707031, 35.38993453979492, 36.80982208251953, 38.229705810546875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 5.0, 7.0, 7.0, 8.0, 8.0, 13.0, 8.0, 14.0, 14.0, 14.0, 18.0, 18.0, 23.0, 27.0, 26.0, 28.0, 44.0, 36.0, 35.0, 33.0, 31.0, 35.0, 43.0, 25.0, 32.0, 37.0, 33.0, 44.0, 24.0, 42.0, 27.0, 27.0, 23.0, 25.0, 24.0, 24.0, 18.0, 20.0, 17.0, 18.0, 7.0, 11.0, 7.0, 7.0, 1.0, 9.0, 4.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.9921875, -5.81292724609375, -5.6336669921875, -5.45440673828125, -5.275146484375, -5.09588623046875, -4.9166259765625, -4.73736572265625, -4.55810546875, -4.37884521484375, -4.1995849609375, -4.02032470703125, -3.841064453125, -3.66180419921875, -3.4825439453125, -3.30328369140625, -3.1240234375, -2.94476318359375, -2.7655029296875, -2.58624267578125, -2.406982421875, -2.22772216796875, -2.0484619140625, -1.86920166015625, -1.68994140625, -1.51068115234375, -1.3314208984375, -1.15216064453125, -0.972900390625, -0.79364013671875, -0.6143798828125, -0.43511962890625, -0.255859375, -0.07659912109375, 0.1026611328125, 0.28192138671875, 0.461181640625, 0.64044189453125, 0.8197021484375, 0.99896240234375, 1.17822265625, 1.35748291015625, 1.5367431640625, 1.71600341796875, 1.895263671875, 2.07452392578125, 2.2537841796875, 2.43304443359375, 2.6123046875, 2.79156494140625, 2.9708251953125, 3.15008544921875, 3.329345703125, 3.50860595703125, 3.6878662109375, 3.86712646484375, 4.04638671875, 4.22564697265625, 4.4049072265625, 4.58416748046875, 4.763427734375, 4.94268798828125, 5.1219482421875, 5.30120849609375, 5.48046875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 4.0, 6.0, 14.0, 18.0, 20.0, 25.0, 39.0, 85.0, 78.0, 111.0, 175.0, 238.0, 319.0, 469.0, 689.0, 997.0, 1463.0, 2152.0, 3107.0, 4482.0, 6766.0, 9782.0, 14837.0, 21960.0, 32901.0, 51290.0, 83634.0, 158844.0, 280668.0, 147679.0, 79871.0, 48877.0, 31766.0, 20945.0, 13866.0, 9735.0, 6558.0, 4437.0, 3055.0, 2029.0, 1354.0, 1021.0, 652.0, 480.0, 286.0, 230.0, 165.0, 123.0, 67.0, 59.0, 45.0, 26.0, 19.0, 18.0, 10.0, 4.0, 6.0, 5.0, 3.0, 1.0, 1.0], "bins": [-1.1513671875, -1.1147613525390625, -1.078155517578125, -1.0415496826171875, -1.00494384765625, -0.9683380126953125, -0.931732177734375, -0.8951263427734375, -0.8585205078125, -0.8219146728515625, -0.785308837890625, -0.7487030029296875, -0.71209716796875, -0.6754913330078125, -0.638885498046875, -0.6022796630859375, -0.565673828125, -0.5290679931640625, -0.492462158203125, -0.4558563232421875, -0.41925048828125, -0.3826446533203125, -0.346038818359375, -0.3094329833984375, -0.2728271484375, -0.2362213134765625, -0.199615478515625, -0.1630096435546875, -0.12640380859375, -0.0897979736328125, -0.053192138671875, -0.0165863037109375, 0.02001953125, 0.0566253662109375, 0.093231201171875, 0.1298370361328125, 0.16644287109375, 0.2030487060546875, 0.239654541015625, 0.2762603759765625, 0.3128662109375, 0.3494720458984375, 0.386077880859375, 0.4226837158203125, 0.45928955078125, 0.4958953857421875, 0.532501220703125, 0.5691070556640625, 0.605712890625, 0.6423187255859375, 0.678924560546875, 0.7155303955078125, 0.75213623046875, 0.7887420654296875, 0.825347900390625, 0.8619537353515625, 0.8985595703125, 0.9351654052734375, 0.971771240234375, 1.0083770751953125, 1.04498291015625, 1.0815887451171875, 1.118194580078125, 1.1548004150390625, 1.19140625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 7.0, 5.0, 8.0, 17.0, 8.0, 16.0, 18.0, 19.0, 21.0, 27.0, 20.0, 25.0, 25.0, 29.0, 42.0, 37.0, 54.0, 35.0, 34.0, 25.0, 1072.0, 39.0, 36.0, 37.0, 40.0, 33.0, 38.0, 39.0, 24.0, 31.0, 24.0, 20.0, 10.0, 14.0, 16.0, 22.0, 8.0, 16.0, 5.0, 4.0, 4.0, 9.0, 3.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-3.826171875, -3.7052001953125, -3.584228515625, -3.4632568359375, -3.34228515625, -3.2213134765625, -3.100341796875, -2.9793701171875, -2.8583984375, -2.7374267578125, -2.616455078125, -2.4954833984375, -2.37451171875, -2.2535400390625, -2.132568359375, -2.0115966796875, -1.890625, -1.7696533203125, -1.648681640625, -1.5277099609375, -1.40673828125, -1.2857666015625, -1.164794921875, -1.0438232421875, -0.9228515625, -0.8018798828125, -0.680908203125, -0.5599365234375, -0.43896484375, -0.3179931640625, -0.197021484375, -0.0760498046875, 0.044921875, 0.1658935546875, 0.286865234375, 0.4078369140625, 0.52880859375, 0.6497802734375, 0.770751953125, 0.8917236328125, 1.0126953125, 1.1336669921875, 1.254638671875, 1.3756103515625, 1.49658203125, 1.6175537109375, 1.738525390625, 1.8594970703125, 1.98046875, 2.1014404296875, 2.222412109375, 2.3433837890625, 2.46435546875, 2.5853271484375, 2.706298828125, 2.8272705078125, 2.9482421875, 3.0692138671875, 3.190185546875, 3.3111572265625, 3.43212890625, 3.5531005859375, 3.674072265625, 3.7950439453125, 3.916015625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 8.0, 4.0, 3.0, 7.0, 22.0, 17.0, 37.0, 43.0, 79.0, 139.0, 254.0, 401.0, 783.0, 1375.0, 2630.0, 4817.0, 9040.0, 16965.0, 33299.0, 68864.0, 169168.0, 1481625.0, 168617.0, 69026.0, 33254.0, 17065.0, 8986.0, 4783.0, 2599.0, 1350.0, 784.0, 430.0, 267.0, 127.0, 93.0, 56.0, 35.0, 20.0, 14.0, 15.0, 8.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.9033203125, -1.844757080078125, -1.78619384765625, -1.727630615234375, -1.6690673828125, -1.610504150390625, -1.55194091796875, -1.493377685546875, -1.434814453125, -1.376251220703125, -1.31768798828125, -1.259124755859375, -1.2005615234375, -1.141998291015625, -1.08343505859375, -1.024871826171875, -0.96630859375, -0.907745361328125, -0.84918212890625, -0.790618896484375, -0.7320556640625, -0.673492431640625, -0.61492919921875, -0.556365966796875, -0.497802734375, -0.439239501953125, -0.38067626953125, -0.322113037109375, -0.2635498046875, -0.204986572265625, -0.14642333984375, -0.087860107421875, -0.029296875, 0.029266357421875, 0.08782958984375, 0.146392822265625, 0.2049560546875, 0.263519287109375, 0.32208251953125, 0.380645751953125, 0.439208984375, 0.497772216796875, 0.55633544921875, 0.614898681640625, 0.6734619140625, 0.732025146484375, 0.79058837890625, 0.849151611328125, 0.90771484375, 0.966278076171875, 1.02484130859375, 1.083404541015625, 1.1419677734375, 1.200531005859375, 1.25909423828125, 1.317657470703125, 1.376220703125, 1.434783935546875, 1.49334716796875, 1.551910400390625, 1.6104736328125, 1.669036865234375, 1.72760009765625, 1.786163330078125, 1.8447265625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 2.0, 5.0, 4.0, 10.0, 14.0, 8.0, 8.0, 22.0, 22.0, 21.0, 27.0, 42.0, 46.0, 62.0, 69.0, 75.0, 101.0, 88.0, 71.0, 62.0, 46.0, 42.0, 35.0, 32.0, 21.0, 13.0, 13.0, 10.0, 5.0, 9.0, 2.0, 5.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008993148803710938, -0.0008688569068908691, -0.0008383989334106445, -0.0008079409599304199, -0.0007774829864501953, -0.0007470250129699707, -0.0007165670394897461, -0.0006861090660095215, -0.0006556510925292969, -0.0006251931190490723, -0.0005947351455688477, -0.000564277172088623, -0.0005338191986083984, -0.0005033612251281738, -0.0004729032516479492, -0.0004424452781677246, -0.0004119873046875, -0.0003815293312072754, -0.0003510713577270508, -0.00032061338424682617, -0.00029015541076660156, -0.00025969743728637695, -0.00022923946380615234, -0.00019878149032592773, -0.00016832351684570312, -0.00013786554336547852, -0.0001074075698852539, -7.69495964050293e-05, -4.649162292480469e-05, -1.6033649444580078e-05, 1.4424324035644531e-05, 4.488229751586914e-05, 7.534027099609375e-05, 0.00010579824447631836, 0.00013625621795654297, 0.00016671419143676758, 0.0001971721649169922, 0.0002276301383972168, 0.0002580881118774414, 0.000288546085357666, 0.0003190040588378906, 0.00034946203231811523, 0.00037992000579833984, 0.00041037797927856445, 0.00044083595275878906, 0.00047129392623901367, 0.0005017518997192383, 0.0005322098731994629, 0.0005626678466796875, 0.0005931258201599121, 0.0006235837936401367, 0.0006540417671203613, 0.0006844997406005859, 0.0007149577140808105, 0.0007454156875610352, 0.0007758736610412598, 0.0008063316345214844, 0.000836789608001709, 0.0008672475814819336, 0.0008977055549621582, 0.0009281635284423828, 0.0009586215019226074, 0.000989079475402832, 0.0010195374488830566, 0.0010499954223632812]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 3.0, 5.0, 6.0, 10.0, 11.0, 19.0, 25.0, 40.0, 53.0, 58.0, 107.0, 126.0, 307.0, 969.0, 355469.0, 689429.0, 1072.0, 332.0, 159.0, 89.0, 65.0, 49.0, 41.0, 23.0, 16.0, 18.0, 13.0, 10.0, 9.0, 3.0, 5.0, 2.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0246124267578125, -0.02388930320739746, -0.023166179656982422, -0.022443056106567383, -0.021719932556152344, -0.020996809005737305, -0.020273685455322266, -0.019550561904907227, -0.018827438354492188, -0.01810431480407715, -0.01738119125366211, -0.01665806770324707, -0.01593494415283203, -0.015211820602416992, -0.014488697052001953, -0.013765573501586914, -0.013042449951171875, -0.012319326400756836, -0.011596202850341797, -0.010873079299926758, -0.010149955749511719, -0.00942683219909668, -0.00870370864868164, -0.007980585098266602, -0.0072574615478515625, -0.0065343379974365234, -0.005811214447021484, -0.005088090896606445, -0.004364967346191406, -0.003641843795776367, -0.002918720245361328, -0.002195596694946289, -0.00147247314453125, -0.0007493495941162109, -2.6226043701171875e-05, 0.0006968975067138672, 0.0014200210571289062, 0.0021431446075439453, 0.0028662681579589844, 0.0035893917083740234, 0.0043125152587890625, 0.0050356388092041016, 0.005758762359619141, 0.00648188591003418, 0.007205009460449219, 0.007928133010864258, 0.008651256561279297, 0.009374380111694336, 0.010097503662109375, 0.010820627212524414, 0.011543750762939453, 0.012266874313354492, 0.012989997863769531, 0.01371312141418457, 0.01443624496459961, 0.015159368515014648, 0.015882492065429688, 0.016605615615844727, 0.017328739166259766, 0.018051862716674805, 0.018774986267089844, 0.019498109817504883, 0.020221233367919922, 0.02094435691833496, 0.02166748046875]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 10.0, 32.0, 81.0, 183.0, 249.0, 217.0, 132.0, 65.0, 25.0, 8.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007460244814865291, -0.0007133390172384679, -0.0006806536111980677, -0.0006479681469500065, -0.0006152826827019453, -0.0005825972184538841, -0.0005499117542058229, -0.0005172263481654227, -0.0004845408839173615, -0.0004518554196693003, -0.0004191699845250696, -0.00038648454938083887, -0.0003537990851327777, -0.0003211136208847165, -0.0002884281857404858, -0.00025574275059625506, -0.00022305728634819388, -0.00019037183665204793, -0.00015768638695590198, -0.00012500093725975603, -9.231548756361008e-05, -5.9630037867464125e-05, -2.6944588171318173e-05, 5.740861524827778e-06, 3.842631122097373e-05, 7.111176091711968e-05, 0.00010379721061326563, 0.00013648266030941159, 0.00016916811000555754, 0.0002018535597017035, 0.00023453900939784944, 0.00026722444454208016, 0.00029990996699780226, 0.00033259543124586344, 0.00036528086639009416, 0.0003979663015343249, 0.00043065176578238606, 0.00046333723003044724, 0.0004960226360708475, 0.0005287081003189087, 0.0005613935645669699, 0.000594079028815031, 0.0006267644930630922, 0.0006594498991034925, 0.0006921353633515537, 0.0007248208275996149, 0.0007575062336400151, 0.0007901916978880763, 0.0008228771621361375, 0.0008555626263841987, 0.0008882480906322598, 0.0009209334966726601, 0.0009536189609207213, 0.0009863043669611216, 0.0010189898312091827, 0.001051675295457244, 0.001084360759705305, 0.0011170462239533663, 0.0011497316882014275, 0.0011824171524494886, 0.0012151026166975498, 0.0012477879645302892, 0.0012804734287783504, 0.0013131588930264115, 0.0013458443572744727]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 8.0, 6.0, 4.0, 12.0, 8.0, 8.0, 9.0, 19.0, 24.0, 18.0, 24.0, 28.0, 25.0, 33.0, 25.0, 31.0, 30.0, 38.0, 44.0, 37.0, 41.0, 31.0, 38.0, 35.0, 34.0, 36.0, 31.0, 37.0, 29.0, 38.0, 26.0, 22.0, 27.0, 28.0, 22.0, 16.0, 13.0, 13.0, 12.0, 16.0, 8.0, 5.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00037676095962524414, -0.00036496203392744064, -0.00035316310822963715, -0.00034136418253183365, -0.00032956525683403015, -0.00031776633113622665, -0.00030596740543842316, -0.00029416847974061966, -0.00028236955404281616, -0.00027057062834501266, -0.00025877170264720917, -0.00024697277694940567, -0.00023517385125160217, -0.00022337492555379868, -0.00021157599985599518, -0.00019977707415819168, -0.00018797814846038818, -0.00017617922276258469, -0.0001643802970647812, -0.0001525813713669777, -0.0001407824456691742, -0.0001289835199713707, -0.0001171845942735672, -0.0001053856685757637, -9.35867428779602e-05, -8.178781718015671e-05, -6.998889148235321e-05, -5.818996578454971e-05, -4.6391040086746216e-05, -3.459211438894272e-05, -2.279318869113922e-05, -1.0994262993335724e-05, 8.046627044677734e-07, 1.260358840227127e-05, 2.4402514100074768e-05, 3.6201439797878265e-05, 4.800036549568176e-05, 5.979929119348526e-05, 7.159821689128876e-05, 8.339714258909225e-05, 9.519606828689575e-05, 0.00010699499398469925, 0.00011879391968250275, 0.00013059284538030624, 0.00014239177107810974, 0.00015419069677591324, 0.00016598962247371674, 0.00017778854817152023, 0.00018958747386932373, 0.00020138639956712723, 0.00021318532526493073, 0.00022498425096273422, 0.00023678317666053772, 0.0002485821023583412, 0.0002603810280561447, 0.0002721799537539482, 0.0002839788794517517, 0.0002957778051495552, 0.0003075767308473587, 0.0003193756565451622, 0.0003311745822429657, 0.0003429735079407692, 0.0003547724336385727, 0.0003665713593363762, 0.0003783702850341797]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 5.0, 7.0, 7.0, 8.0, 8.0, 13.0, 8.0, 14.0, 14.0, 14.0, 18.0, 18.0, 23.0, 27.0, 26.0, 28.0, 44.0, 36.0, 35.0, 33.0, 31.0, 35.0, 43.0, 25.0, 32.0, 37.0, 33.0, 44.0, 24.0, 42.0, 27.0, 27.0, 23.0, 25.0, 24.0, 24.0, 18.0, 20.0, 17.0, 18.0, 7.0, 11.0, 7.0, 7.0, 1.0, 9.0, 4.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-5.9921875, -5.81292724609375, -5.6336669921875, -5.45440673828125, -5.275146484375, -5.09588623046875, -4.9166259765625, -4.73736572265625, -4.55810546875, -4.37884521484375, -4.1995849609375, -4.02032470703125, -3.841064453125, -3.66180419921875, -3.4825439453125, -3.30328369140625, -3.1240234375, -2.94476318359375, -2.7655029296875, -2.58624267578125, -2.406982421875, -2.22772216796875, -2.0484619140625, -1.86920166015625, -1.68994140625, -1.51068115234375, -1.3314208984375, -1.15216064453125, -0.972900390625, -0.79364013671875, -0.6143798828125, -0.43511962890625, -0.255859375, -0.07659912109375, 0.1026611328125, 0.28192138671875, 0.461181640625, 0.64044189453125, 0.8197021484375, 0.99896240234375, 1.17822265625, 1.35748291015625, 1.5367431640625, 1.71600341796875, 1.895263671875, 2.07452392578125, 2.2537841796875, 2.43304443359375, 2.6123046875, 2.79156494140625, 2.9708251953125, 3.15008544921875, 3.329345703125, 3.50860595703125, 3.6878662109375, 3.86712646484375, 4.04638671875, 4.22564697265625, 4.4049072265625, 4.58416748046875, 4.763427734375, 4.94268798828125, 5.1219482421875, 5.30120849609375, 5.48046875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 5.0, 2.0, 8.0, 9.0, 14.0, 13.0, 13.0, 18.0, 32.0, 48.0, 79.0, 123.0, 248.0, 450.0, 991.0, 2086.0, 4653.0, 10481.0, 26325.0, 72725.0, 224734.0, 440120.0, 171675.0, 56554.0, 21051.0, 8735.0, 3867.0, 1731.0, 812.0, 414.0, 200.0, 114.0, 68.0, 42.0, 32.0, 17.0, 16.0, 10.0, 15.0, 9.0, 5.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.94921875, -4.79638671875, -4.6435546875, -4.49072265625, -4.337890625, -4.18505859375, -4.0322265625, -3.87939453125, -3.7265625, -3.57373046875, -3.4208984375, -3.26806640625, -3.115234375, -2.96240234375, -2.8095703125, -2.65673828125, -2.50390625, -2.35107421875, -2.1982421875, -2.04541015625, -1.892578125, -1.73974609375, -1.5869140625, -1.43408203125, -1.28125, -1.12841796875, -0.9755859375, -0.82275390625, -0.669921875, -0.51708984375, -0.3642578125, -0.21142578125, -0.05859375, 0.09423828125, 0.2470703125, 0.39990234375, 0.552734375, 0.70556640625, 0.8583984375, 1.01123046875, 1.1640625, 1.31689453125, 1.4697265625, 1.62255859375, 1.775390625, 1.92822265625, 2.0810546875, 2.23388671875, 2.38671875, 2.53955078125, 2.6923828125, 2.84521484375, 2.998046875, 3.15087890625, 3.3037109375, 3.45654296875, 3.609375, 3.76220703125, 3.9150390625, 4.06787109375, 4.220703125, 4.37353515625, 4.5263671875, 4.67919921875, 4.83203125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 6.0, 4.0, 6.0, 6.0, 4.0, 9.0, 10.0, 5.0, 11.0, 7.0, 11.0, 25.0, 21.0, 26.0, 31.0, 20.0, 33.0, 36.0, 48.0, 43.0, 56.0, 85.0, 241.0, 1647.0, 176.0, 64.0, 56.0, 55.0, 46.0, 36.0, 35.0, 26.0, 28.0, 29.0, 17.0, 21.0, 10.0, 10.0, 15.0, 5.0, 5.0, 6.0, 11.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-20.84375, -20.1591796875, -19.474609375, -18.7900390625, -18.10546875, -17.4208984375, -16.736328125, -16.0517578125, -15.3671875, -14.6826171875, -13.998046875, -13.3134765625, -12.62890625, -11.9443359375, -11.259765625, -10.5751953125, -9.890625, -9.2060546875, -8.521484375, -7.8369140625, -7.15234375, -6.4677734375, -5.783203125, -5.0986328125, -4.4140625, -3.7294921875, -3.044921875, -2.3603515625, -1.67578125, -0.9912109375, -0.306640625, 0.3779296875, 1.0625, 1.7470703125, 2.431640625, 3.1162109375, 3.80078125, 4.4853515625, 5.169921875, 5.8544921875, 6.5390625, 7.2236328125, 7.908203125, 8.5927734375, 9.27734375, 9.9619140625, 10.646484375, 11.3310546875, 12.015625, 12.7001953125, 13.384765625, 14.0693359375, 14.75390625, 15.4384765625, 16.123046875, 16.8076171875, 17.4921875, 18.1767578125, 18.861328125, 19.5458984375, 20.23046875, 20.9150390625, 21.599609375, 22.2841796875, 22.96875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 4.0, 1.0, 11.0, 10.0, 8.0, 7.0, 12.0, 13.0, 23.0, 27.0, 34.0, 50.0, 59.0, 72.0, 81.0, 111.0, 207.0, 266.0, 367.0, 918.0, 15891.0, 3107316.0, 17758.0, 1033.0, 407.0, 240.0, 193.0, 122.0, 79.0, 79.0, 68.0, 52.0, 29.0, 39.0, 21.0, 22.0, 10.0, 12.0, 7.0, 14.0, 6.0, 3.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0], "bins": [-55.09375, -53.44970703125, -51.8056640625, -50.16162109375, -48.517578125, -46.87353515625, -45.2294921875, -43.58544921875, -41.94140625, -40.29736328125, -38.6533203125, -37.00927734375, -35.365234375, -33.72119140625, -32.0771484375, -30.43310546875, -28.7890625, -27.14501953125, -25.5009765625, -23.85693359375, -22.212890625, -20.56884765625, -18.9248046875, -17.28076171875, -15.63671875, -13.99267578125, -12.3486328125, -10.70458984375, -9.060546875, -7.41650390625, -5.7724609375, -4.12841796875, -2.484375, -0.84033203125, 0.8037109375, 2.44775390625, 4.091796875, 5.73583984375, 7.3798828125, 9.02392578125, 10.66796875, 12.31201171875, 13.9560546875, 15.60009765625, 17.244140625, 18.88818359375, 20.5322265625, 22.17626953125, 23.8203125, 25.46435546875, 27.1083984375, 28.75244140625, 30.396484375, 32.04052734375, 33.6845703125, 35.32861328125, 36.97265625, 38.61669921875, 40.2607421875, 41.90478515625, 43.548828125, 45.19287109375, 46.8369140625, 48.48095703125, 50.125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [943.0, 74.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.42177677154541, 2.5612010955810547, 15.54417896270752, 28.527156829833984, 41.510135650634766, 54.49311065673828, 67.47608947753906, 80.45906829833984, 93.44204711914062, 106.4250259399414, 119.40800476074219, 132.39097595214844, 145.37396240234375, 158.35693359375, 171.33990478515625, 184.32289123535156, 197.3058624267578, 210.28883361816406, 223.27182006835938, 236.25479125976562, 249.23777770996094, 262.22076416015625, 275.2037353515625, 288.18670654296875, 301.169677734375, 314.15264892578125, 327.1356201171875, 340.1186218261719, 353.1015930175781, 366.0845642089844, 379.0675354003906, 392.050537109375, 405.0335388183594, 418.0165100097656, 430.9994812011719, 443.98248291015625, 456.9654541015625, 469.94842529296875, 482.931396484375, 495.91436767578125, 508.8973693847656, 521.88037109375, 534.8633422851562, 547.8463134765625, 560.8292846679688, 573.812255859375, 586.7952270507812, 599.7781982421875, 612.7611694335938, 625.744140625, 638.7271118164062, 651.7100830078125, 664.6930541992188, 677.676025390625, 690.6590576171875, 703.6420288085938, 716.625, 729.6079711914062, 742.5909423828125, 755.5739135742188, 768.556884765625, 781.5399169921875, 794.5228881835938, 807.505859375, 820.4888305664062]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 6.0, 4.0, 13.0, 8.0, 9.0, 14.0, 11.0, 20.0, 22.0, 28.0, 20.0, 18.0, 23.0, 28.0, 33.0, 30.0, 41.0, 31.0, 41.0, 28.0, 43.0, 36.0, 42.0, 39.0, 38.0, 32.0, 32.0, 43.0, 41.0, 29.0, 24.0, 24.0, 22.0, 12.0, 24.0, 12.0, 13.0, 12.0, 9.0, 11.0, 7.0, 7.0, 4.0, 8.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-53.863243103027344, -52.18843078613281, -50.51361846923828, -48.838802337646484, -47.16399002075195, -45.48917770385742, -43.814361572265625, -42.139549255371094, -40.46473693847656, -38.78992462158203, -37.1151123046875, -35.4402961730957, -33.76548385620117, -32.09067153930664, -30.415857315063477, -28.741043090820312, -27.06623077392578, -25.39141845703125, -23.716604232788086, -22.041790008544922, -20.36697769165039, -18.69216537475586, -17.017351150512695, -15.342537879943848, -13.667724609375, -11.992911338806152, -10.318098068237305, -8.643284797668457, -6.968471527099609, -5.293658256530762, -3.618844985961914, -1.9440317153930664, -0.26921844482421875, 1.405594825744629, 3.0804080963134766, 4.755221366882324, 6.430034637451172, 8.10484790802002, 9.779661178588867, 11.454474449157715, 13.129287719726562, 14.80410099029541, 16.478914260864258, 18.153728485107422, 19.828540802001953, 21.503353118896484, 23.17816734313965, 24.852981567382812, 26.527793884277344, 28.202606201171875, 29.87742042541504, 31.552234649658203, 33.227046966552734, 34.901859283447266, 36.57667541503906, 38.251487731933594, 39.926300048828125, 41.601112365722656, 43.27592468261719, 44.950740814208984, 46.625553131103516, 48.30036544799805, 49.975181579589844, 51.649993896484375, 53.324806213378906]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 7.0, 9.0, 7.0, 10.0, 11.0, 7.0, 9.0, 13.0, 18.0, 15.0, 22.0, 22.0, 27.0, 36.0, 30.0, 36.0, 42.0, 28.0, 24.0, 31.0, 30.0, 41.0, 42.0, 29.0, 41.0, 42.0, 39.0, 22.0, 25.0, 39.0, 27.0, 27.0, 17.0, 16.0, 23.0, 24.0, 19.0, 11.0, 19.0, 11.0, 8.0, 12.0, 8.0, 1.0, 7.0, 3.0, 6.0, 3.0, 6.0, 2.0, 0.0, 1.0], "bins": [-6.3125, -6.129150390625, -5.94580078125, -5.762451171875, -5.5791015625, -5.395751953125, -5.21240234375, -5.029052734375, -4.845703125, -4.662353515625, -4.47900390625, -4.295654296875, -4.1123046875, -3.928955078125, -3.74560546875, -3.562255859375, -3.37890625, -3.195556640625, -3.01220703125, -2.828857421875, -2.6455078125, -2.462158203125, -2.27880859375, -2.095458984375, -1.912109375, -1.728759765625, -1.54541015625, -1.362060546875, -1.1787109375, -0.995361328125, -0.81201171875, -0.628662109375, -0.4453125, -0.261962890625, -0.07861328125, 0.104736328125, 0.2880859375, 0.471435546875, 0.65478515625, 0.838134765625, 1.021484375, 1.204833984375, 1.38818359375, 1.571533203125, 1.7548828125, 1.938232421875, 2.12158203125, 2.304931640625, 2.48828125, 2.671630859375, 2.85498046875, 3.038330078125, 3.2216796875, 3.405029296875, 3.58837890625, 3.771728515625, 3.955078125, 4.138427734375, 4.32177734375, 4.505126953125, 4.6884765625, 4.871826171875, 5.05517578125, 5.238525390625, 5.421875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 3.0, 7.0, 8.0, 12.0, 7.0, 7.0, 3.0, 8.0, 17.0, 17.0, 23.0, 21.0, 27.0, 37.0, 47.0, 75.0, 84.0, 162.0, 285.0, 617.0, 1451.0, 5384.0, 63653.0, 1801161.0, 2220676.0, 90747.0, 6624.0, 1598.0, 604.0, 296.0, 179.0, 113.0, 72.0, 39.0, 32.0, 22.0, 23.0, 19.0, 13.0, 22.0, 9.0, 22.0, 5.0, 12.0, 6.0, 6.0, 8.0, 6.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-20.140625, -19.53125, -18.921875, -18.3125, -17.703125, -17.09375, -16.484375, -15.875, -15.265625, -14.65625, -14.046875, -13.4375, -12.828125, -12.21875, -11.609375, -11.0, -10.390625, -9.78125, -9.171875, -8.5625, -7.953125, -7.34375, -6.734375, -6.125, -5.515625, -4.90625, -4.296875, -3.6875, -3.078125, -2.46875, -1.859375, -1.25, -0.640625, -0.03125, 0.578125, 1.1875, 1.796875, 2.40625, 3.015625, 3.625, 4.234375, 4.84375, 5.453125, 6.0625, 6.671875, 7.28125, 7.890625, 8.5, 9.109375, 9.71875, 10.328125, 10.9375, 11.546875, 12.15625, 12.765625, 13.375, 13.984375, 14.59375, 15.203125, 15.8125, 16.421875, 17.03125, 17.640625, 18.25, 18.859375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 7.0, 6.0, 12.0, 10.0, 16.0, 25.0, 44.0, 45.0, 96.0, 111.0, 141.0, 230.0, 285.0, 396.0, 500.0, 540.0, 462.0, 363.0, 250.0, 168.0, 117.0, 68.0, 58.0, 38.0, 37.0, 19.0, 13.0, 3.0, 7.0, 7.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.640625, -17.201171875, -16.76171875, -16.322265625, -15.8828125, -15.443359375, -15.00390625, -14.564453125, -14.125, -13.685546875, -13.24609375, -12.806640625, -12.3671875, -11.927734375, -11.48828125, -11.048828125, -10.609375, -10.169921875, -9.73046875, -9.291015625, -8.8515625, -8.412109375, -7.97265625, -7.533203125, -7.09375, -6.654296875, -6.21484375, -5.775390625, -5.3359375, -4.896484375, -4.45703125, -4.017578125, -3.578125, -3.138671875, -2.69921875, -2.259765625, -1.8203125, -1.380859375, -0.94140625, -0.501953125, -0.0625, 0.376953125, 0.81640625, 1.255859375, 1.6953125, 2.134765625, 2.57421875, 3.013671875, 3.453125, 3.892578125, 4.33203125, 4.771484375, 5.2109375, 5.650390625, 6.08984375, 6.529296875, 6.96875, 7.408203125, 7.84765625, 8.287109375, 8.7265625, 9.166015625, 9.60546875, 10.044921875, 10.484375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 7.0, 7.0, 18.0, 18.0, 28.0, 43.0, 65.0, 95.0, 101.0, 122.0, 175.0, 261.0, 390.0, 716.0, 5319.0, 3946443.0, 237203.0, 1506.0, 491.0, 339.0, 216.0, 190.0, 138.0, 98.0, 68.0, 55.0, 50.0, 33.0, 26.0, 21.0, 11.0, 15.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.0, -51.8212890625, -49.642578125, -47.4638671875, -45.28515625, -43.1064453125, -40.927734375, -38.7490234375, -36.5703125, -34.3916015625, -32.212890625, -30.0341796875, -27.85546875, -25.6767578125, -23.498046875, -21.3193359375, -19.140625, -16.9619140625, -14.783203125, -12.6044921875, -10.42578125, -8.2470703125, -6.068359375, -3.8896484375, -1.7109375, 0.4677734375, 2.646484375, 4.8251953125, 7.00390625, 9.1826171875, 11.361328125, 13.5400390625, 15.71875, 17.8974609375, 20.076171875, 22.2548828125, 24.43359375, 26.6123046875, 28.791015625, 30.9697265625, 33.1484375, 35.3271484375, 37.505859375, 39.6845703125, 41.86328125, 44.0419921875, 46.220703125, 48.3994140625, 50.578125, 52.7568359375, 54.935546875, 57.1142578125, 59.29296875, 61.4716796875, 63.650390625, 65.8291015625, 68.0078125, 70.1865234375, 72.365234375, 74.5439453125, 76.72265625, 78.9013671875, 81.080078125, 83.2587890625, 85.4375]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 12.0, 19.0, 61.0, 100.0, 191.0, 181.0, 177.0, 132.0, 59.0, 43.0, 17.0, 5.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.753108978271484, -56.550594329833984, -54.34807586669922, -52.14556121826172, -49.94304656982422, -47.74053192138672, -45.53801345825195, -43.33549880981445, -41.13298034667969, -38.93046569824219, -36.72794723510742, -34.52543258666992, -32.32291793823242, -30.12040138244629, -27.917884826660156, -25.715370178222656, -23.512855529785156, -21.310338973999023, -19.107824325561523, -16.90530776977539, -14.702792167663574, -12.500276565551758, -10.297760009765625, -8.095244407653809, -5.892728805541992, -3.6902129650115967, -1.4876971244812012, 0.7148189544677734, 2.91733455657959, 5.119850158691406, 7.322366714477539, 9.524882316589355, 11.727401733398438, 13.929917335510254, 16.13243293762207, 18.334949493408203, 20.537464141845703, 22.739980697631836, 24.94249725341797, 27.14501190185547, 29.3475284576416, 31.550045013427734, 33.752559661865234, 35.955078125, 38.1575927734375, 40.360107421875, 42.5626220703125, 44.765140533447266, 46.967655181884766, 49.170169830322266, 51.37268829345703, 53.57520294189453, 55.77771759033203, 57.98023223876953, 60.1827507019043, 62.3852653503418, 64.58778381347656, 66.79029846191406, 68.99281311035156, 71.19532775878906, 73.3978500366211, 75.6003646850586, 77.8028793334961, 80.0053939819336, 82.2079086303711]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 4.0, 4.0, 7.0, 7.0, 21.0, 14.0, 23.0, 19.0, 18.0, 19.0, 25.0, 25.0, 26.0, 28.0, 29.0, 31.0, 33.0, 32.0, 50.0, 49.0, 43.0, 36.0, 41.0, 37.0, 45.0, 46.0, 41.0, 35.0, 28.0, 23.0, 30.0, 13.0, 21.0, 16.0, 21.0, 12.0, 9.0, 15.0, 5.0, 6.0, 5.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-35.92132568359375, -34.709197998046875, -33.4970703125, -32.284942626953125, -31.07281494140625, -29.860687255859375, -28.6485595703125, -27.436431884765625, -26.22430419921875, -25.012176513671875, -23.800048828125, -22.587921142578125, -21.37579345703125, -20.163665771484375, -18.9515380859375, -17.739410400390625, -16.52728271484375, -15.315155029296875, -14.10302734375, -12.890899658203125, -11.67877197265625, -10.466644287109375, -9.2545166015625, -8.042388916015625, -6.83026123046875, -5.618133544921875, -4.406005859375, -3.193878173828125, -1.98175048828125, -0.769622802734375, 0.4425048828125, 1.654632568359375, 2.86676025390625, 4.078887939453125, 5.291015625, 6.503143310546875, 7.71527099609375, 8.927398681640625, 10.1395263671875, 11.351654052734375, 12.56378173828125, 13.775909423828125, 14.988037109375, 16.200164794921875, 17.41229248046875, 18.624420166015625, 19.8365478515625, 21.048675537109375, 22.26080322265625, 23.472930908203125, 24.68505859375, 25.897186279296875, 27.10931396484375, 28.321441650390625, 29.5335693359375, 30.745697021484375, 31.95782470703125, 33.169952392578125, 34.382080078125, 35.594207763671875, 36.80633544921875, 38.018463134765625, 39.2305908203125, 40.442718505859375, 41.65484619140625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 5.0, 3.0, 7.0, 7.0, 4.0, 8.0, 16.0, 12.0, 11.0, 15.0, 19.0, 15.0, 21.0, 21.0, 29.0, 38.0, 36.0, 36.0, 39.0, 28.0, 29.0, 30.0, 35.0, 50.0, 35.0, 35.0, 36.0, 31.0, 30.0, 29.0, 35.0, 27.0, 23.0, 29.0, 28.0, 24.0, 11.0, 17.0, 23.0, 15.0, 11.0, 11.0, 6.0, 3.0, 4.0, 5.0, 7.0, 6.0, 2.0, 5.0, 4.0, 0.0, 2.0, 3.0], "bins": [-6.140625, -5.95965576171875, -5.7786865234375, -5.59771728515625, -5.416748046875, -5.23577880859375, -5.0548095703125, -4.87384033203125, -4.69287109375, -4.51190185546875, -4.3309326171875, -4.14996337890625, -3.968994140625, -3.78802490234375, -3.6070556640625, -3.42608642578125, -3.2451171875, -3.06414794921875, -2.8831787109375, -2.70220947265625, -2.521240234375, -2.34027099609375, -2.1593017578125, -1.97833251953125, -1.79736328125, -1.61639404296875, -1.4354248046875, -1.25445556640625, -1.073486328125, -0.89251708984375, -0.7115478515625, -0.53057861328125, -0.349609375, -0.16864013671875, 0.0123291015625, 0.19329833984375, 0.374267578125, 0.55523681640625, 0.7362060546875, 0.91717529296875, 1.09814453125, 1.27911376953125, 1.4600830078125, 1.64105224609375, 1.822021484375, 2.00299072265625, 2.1839599609375, 2.36492919921875, 2.5458984375, 2.72686767578125, 2.9078369140625, 3.08880615234375, 3.269775390625, 3.45074462890625, 3.6317138671875, 3.81268310546875, 3.99365234375, 4.17462158203125, 4.3555908203125, 4.53656005859375, 4.717529296875, 4.89849853515625, 5.0794677734375, 5.26043701171875, 5.44140625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 6.0, 7.0, 3.0, 14.0, 27.0, 23.0, 41.0, 70.0, 74.0, 108.0, 144.0, 232.0, 312.0, 437.0, 632.0, 883.0, 1199.0, 1715.0, 2434.0, 3484.0, 5216.0, 7272.0, 10408.0, 15574.0, 23892.0, 36279.0, 55885.0, 91239.0, 182729.0, 282925.0, 120330.0, 70405.0, 44640.0, 28969.0, 19175.0, 12947.0, 8829.0, 6012.0, 4055.0, 2899.0, 2052.0, 1443.0, 1039.0, 729.0, 577.0, 341.0, 279.0, 168.0, 134.0, 106.0, 50.0, 49.0, 30.0, 18.0, 13.0, 9.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.05859375, -1.023590087890625, -0.98858642578125, -0.953582763671875, -0.9185791015625, -0.883575439453125, -0.84857177734375, -0.813568115234375, -0.778564453125, -0.743560791015625, -0.70855712890625, -0.673553466796875, -0.6385498046875, -0.603546142578125, -0.56854248046875, -0.533538818359375, -0.49853515625, -0.463531494140625, -0.42852783203125, -0.393524169921875, -0.3585205078125, -0.323516845703125, -0.28851318359375, -0.253509521484375, -0.218505859375, -0.183502197265625, -0.14849853515625, -0.113494873046875, -0.0784912109375, -0.043487548828125, -0.00848388671875, 0.026519775390625, 0.0615234375, 0.096527099609375, 0.13153076171875, 0.166534423828125, 0.2015380859375, 0.236541748046875, 0.27154541015625, 0.306549072265625, 0.341552734375, 0.376556396484375, 0.41156005859375, 0.446563720703125, 0.4815673828125, 0.516571044921875, 0.55157470703125, 0.586578369140625, 0.62158203125, 0.656585693359375, 0.69158935546875, 0.726593017578125, 0.7615966796875, 0.796600341796875, 0.83160400390625, 0.866607666015625, 0.901611328125, 0.936614990234375, 0.97161865234375, 1.006622314453125, 1.0416259765625, 1.076629638671875, 1.11163330078125, 1.146636962890625, 1.181640625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 8.0, 4.0, 7.0, 10.0, 13.0, 17.0, 10.0, 25.0, 27.0, 26.0, 29.0, 24.0, 32.0, 38.0, 44.0, 26.0, 41.0, 35.0, 37.0, 1083.0, 32.0, 43.0, 36.0, 30.0, 32.0, 35.0, 33.0, 23.0, 39.0, 31.0, 19.0, 28.0, 16.0, 25.0, 12.0, 14.0, 7.0, 9.0, 4.0, 6.0, 5.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.73828125, -3.60821533203125, -3.4781494140625, -3.34808349609375, -3.218017578125, -3.08795166015625, -2.9578857421875, -2.82781982421875, -2.69775390625, -2.56768798828125, -2.4376220703125, -2.30755615234375, -2.177490234375, -2.04742431640625, -1.9173583984375, -1.78729248046875, -1.6572265625, -1.52716064453125, -1.3970947265625, -1.26702880859375, -1.136962890625, -1.00689697265625, -0.8768310546875, -0.74676513671875, -0.61669921875, -0.48663330078125, -0.3565673828125, -0.22650146484375, -0.096435546875, 0.03363037109375, 0.1636962890625, 0.29376220703125, 0.423828125, 0.55389404296875, 0.6839599609375, 0.81402587890625, 0.944091796875, 1.07415771484375, 1.2042236328125, 1.33428955078125, 1.46435546875, 1.59442138671875, 1.7244873046875, 1.85455322265625, 1.984619140625, 2.11468505859375, 2.2447509765625, 2.37481689453125, 2.5048828125, 2.63494873046875, 2.7650146484375, 2.89508056640625, 3.025146484375, 3.15521240234375, 3.2852783203125, 3.41534423828125, 3.54541015625, 3.67547607421875, 3.8055419921875, 3.93560791015625, 4.065673828125, 4.19573974609375, 4.3258056640625, 4.45587158203125, 4.5859375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 6.0, 7.0, 16.0, 7.0, 22.0, 32.0, 45.0, 78.0, 126.0, 211.0, 445.0, 828.0, 1558.0, 3056.0, 5914.0, 12205.0, 24665.0, 51306.0, 113415.0, 1422074.0, 277883.0, 96062.0, 44248.0, 21414.0, 10525.0, 5263.0, 2696.0, 1371.0, 746.0, 401.0, 195.0, 112.0, 63.0, 37.0, 31.0, 21.0, 10.0, 6.0, 12.0, 3.0, 7.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.220703125, -2.157073974609375, -2.09344482421875, -2.029815673828125, -1.9661865234375, -1.902557373046875, -1.83892822265625, -1.775299072265625, -1.711669921875, -1.648040771484375, -1.58441162109375, -1.520782470703125, -1.4571533203125, -1.393524169921875, -1.32989501953125, -1.266265869140625, -1.20263671875, -1.139007568359375, -1.07537841796875, -1.011749267578125, -0.9481201171875, -0.884490966796875, -0.82086181640625, -0.757232666015625, -0.693603515625, -0.629974365234375, -0.56634521484375, -0.502716064453125, -0.4390869140625, -0.375457763671875, -0.31182861328125, -0.248199462890625, -0.1845703125, -0.120941162109375, -0.05731201171875, 0.006317138671875, 0.0699462890625, 0.133575439453125, 0.19720458984375, 0.260833740234375, 0.324462890625, 0.388092041015625, 0.45172119140625, 0.515350341796875, 0.5789794921875, 0.642608642578125, 0.70623779296875, 0.769866943359375, 0.83349609375, 0.897125244140625, 0.96075439453125, 1.024383544921875, 1.0880126953125, 1.151641845703125, 1.21527099609375, 1.278900146484375, 1.342529296875, 1.406158447265625, 1.46978759765625, 1.533416748046875, 1.5970458984375, 1.660675048828125, 1.72430419921875, 1.787933349609375, 1.8515625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 7.0, 2.0, 3.0, 3.0, 4.0, 9.0, 12.0, 13.0, 25.0, 28.0, 38.0, 46.0, 59.0, 64.0, 93.0, 81.0, 110.0, 56.0, 69.0, 71.0, 47.0, 39.0, 32.0, 29.0, 14.0, 11.0, 5.0, 10.0, 7.0, 2.0, 2.0, 3.0, 6.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0011205673217773438, -0.0010855644941329956, -0.0010505616664886475, -0.0010155588388442993, -0.0009805560111999512, -0.000945553183555603, -0.0009105503559112549, -0.0008755475282669067, -0.0008405447006225586, -0.0008055418729782104, -0.0007705390453338623, -0.0007355362176895142, -0.000700533390045166, -0.0006655305624008179, -0.0006305277347564697, -0.0005955249071121216, -0.0005605220794677734, -0.0005255192518234253, -0.0004905164241790771, -0.000455513596534729, -0.00042051076889038086, -0.0003855079412460327, -0.00035050511360168457, -0.0003155022859573364, -0.0002804994583129883, -0.00024549663066864014, -0.000210493803024292, -0.00017549097537994385, -0.0001404881477355957, -0.00010548532009124756, -7.048249244689941e-05, -3.547966480255127e-05, -4.76837158203125e-07, 3.452599048614502e-05, 6.952881813049316e-05, 0.00010453164577484131, 0.00013953447341918945, 0.0001745373010635376, 0.00020954012870788574, 0.0002445429563522339, 0.00027954578399658203, 0.0003145486116409302, 0.0003495514392852783, 0.00038455426692962646, 0.0004195570945739746, 0.00045455992221832275, 0.0004895627498626709, 0.000524565577507019, 0.0005595684051513672, 0.0005945712327957153, 0.0006295740604400635, 0.0006645768880844116, 0.0006995797157287598, 0.0007345825433731079, 0.0007695853710174561, 0.0008045881986618042, 0.0008395910263061523, 0.0008745938539505005, 0.0009095966815948486, 0.0009445995092391968, 0.000979602336883545, 0.001014605164527893, 0.0010496079921722412, 0.0010846108198165894, 0.0011196136474609375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 4.0, 9.0, 3.0, 5.0, 17.0, 17.0, 34.0, 32.0, 43.0, 75.0, 89.0, 160.0, 372.0, 3793.0, 1041144.0, 1983.0, 327.0, 135.0, 84.0, 63.0, 35.0, 36.0, 33.0, 13.0, 5.0, 7.0, 7.0, 3.0, 4.0, 4.0, 4.0, 1.0, 0.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02655029296875, -0.025705575942993164, -0.024860858917236328, -0.024016141891479492, -0.023171424865722656, -0.02232670783996582, -0.021481990814208984, -0.02063727378845215, -0.019792556762695312, -0.018947839736938477, -0.01810312271118164, -0.017258405685424805, -0.01641368865966797, -0.015568971633911133, -0.014724254608154297, -0.013879537582397461, -0.013034820556640625, -0.012190103530883789, -0.011345386505126953, -0.010500669479370117, -0.009655952453613281, -0.008811235427856445, -0.00796651840209961, -0.0071218013763427734, -0.0062770843505859375, -0.0054323673248291016, -0.004587650299072266, -0.0037429332733154297, -0.0028982162475585938, -0.002053499221801758, -0.0012087821960449219, -0.00036406517028808594, 0.00048065185546875, 0.001325368881225586, 0.002170085906982422, 0.003014802932739258, 0.0038595199584960938, 0.00470423698425293, 0.005548954010009766, 0.0063936710357666016, 0.0072383880615234375, 0.008083105087280273, 0.00892782211303711, 0.009772539138793945, 0.010617256164550781, 0.011461973190307617, 0.012306690216064453, 0.013151407241821289, 0.013996124267578125, 0.014840841293334961, 0.015685558319091797, 0.016530275344848633, 0.01737499237060547, 0.018219709396362305, 0.01906442642211914, 0.019909143447875977, 0.020753860473632812, 0.02159857749938965, 0.022443294525146484, 0.02328801155090332, 0.024132728576660156, 0.024977445602416992, 0.025822162628173828, 0.026666879653930664, 0.0275115966796875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 45.0, 192.0, 367.0, 282.0, 104.0, 17.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0027580843307077885, -0.002707783132791519, -0.00265748193487525, -0.0026071807369589806, -0.0025568795390427113, -0.002506578341126442, -0.0024562771432101727, -0.0024059759452939034, -0.002355674747377634, -0.0023053735494613647, -0.0022550723515450954, -0.002204771153628826, -0.002154469955712557, -0.0021041687577962875, -0.0020538675598800182, -0.002003566361963749, -0.001953264931216836, -0.0019029637333005667, -0.0018526625353842974, -0.001802361337468028, -0.0017520601395517588, -0.0017017589416354895, -0.0016514576273038983, -0.001601156429387629, -0.0015508552314713597, -0.0015005540335550904, -0.0014502528356388211, -0.0013999516377225518, -0.0013496503233909607, -0.0012993491254746914, -0.001249047927558422, -0.0011987467296421528, -0.0011484455317258835, -0.0010981443338096142, -0.0010478431358933449, -0.0009975419379770756, -0.0009472406818531454, -0.0008969394839368761, -0.0008466382278129458, -0.0007963370298966765, -0.0007460358319804072, -0.0006957346340641379, -0.0006454334361478686, -0.0005951321800239384, -0.0005448309821076691, -0.0004945297841913998, -0.00044422855717130005, -0.0003939273301512003, -0.000343626132234931, -0.0002933249343186617, -0.00024302370729856193, -0.0001927224948303774, -0.00014242128236219287, -9.212008444592357e-05, -4.181885742582381e-05, 8.482369594275951e-06, 5.8783567510545254e-05, 0.00010908477997872978, 0.00015938599244691432, 0.00020968720491509885, 0.0002599884173832834, 0.0003102896152995527, 0.00036059084231965244, 0.0004108920693397522, 0.0004611932672560215]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 3.0, 10.0, 6.0, 5.0, 8.0, 14.0, 19.0, 17.0, 20.0, 24.0, 27.0, 20.0, 27.0, 30.0, 35.0, 35.0, 31.0, 37.0, 40.0, 61.0, 35.0, 40.0, 47.0, 47.0, 32.0, 37.0, 31.0, 38.0, 20.0, 35.0, 33.0, 14.0, 17.0, 20.0, 20.0, 15.0, 7.0, 6.0, 10.0, 6.0, 6.0, 6.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00046241283416748047, -0.00044815242290496826, -0.00043389201164245605, -0.00041963160037994385, -0.00040537118911743164, -0.00039111077785491943, -0.0003768503665924072, -0.000362589955329895, -0.0003483295440673828, -0.0003340691328048706, -0.0003198087215423584, -0.0003055483102798462, -0.000291287899017334, -0.0002770274877548218, -0.00026276707649230957, -0.00024850666522979736, -0.00023424625396728516, -0.00021998584270477295, -0.00020572543144226074, -0.00019146502017974854, -0.00017720460891723633, -0.00016294419765472412, -0.00014868378639221191, -0.0001344233751296997, -0.0001201629638671875, -0.00010590255260467529, -9.164214134216309e-05, -7.738173007965088e-05, -6.312131881713867e-05, -4.8860907554626465e-05, -3.460049629211426e-05, -2.034008502960205e-05, -6.079673767089844e-06, 8.180737495422363e-06, 2.244114875793457e-05, 3.670156002044678e-05, 5.0961971282958984e-05, 6.522238254547119e-05, 7.94827938079834e-05, 9.37432050704956e-05, 0.00010800361633300781, 0.00012226402759552002, 0.00013652443885803223, 0.00015078485012054443, 0.00016504526138305664, 0.00017930567264556885, 0.00019356608390808105, 0.00020782649517059326, 0.00022208690643310547, 0.00023634731769561768, 0.0002506077289581299, 0.0002648681402206421, 0.0002791285514831543, 0.0002933889627456665, 0.0003076493740081787, 0.0003219097852706909, 0.0003361701965332031, 0.00035043060779571533, 0.00036469101905822754, 0.00037895143032073975, 0.00039321184158325195, 0.00040747225284576416, 0.00042173266410827637, 0.0004359930753707886, 0.0004502534866333008]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 6.0, 5.0, 3.0, 7.0, 7.0, 4.0, 8.0, 16.0, 12.0, 11.0, 15.0, 19.0, 15.0, 21.0, 21.0, 29.0, 38.0, 36.0, 37.0, 38.0, 28.0, 29.0, 30.0, 35.0, 50.0, 35.0, 35.0, 36.0, 31.0, 30.0, 29.0, 35.0, 27.0, 23.0, 29.0, 28.0, 24.0, 11.0, 17.0, 23.0, 15.0, 11.0, 11.0, 6.0, 3.0, 4.0, 5.0, 7.0, 6.0, 2.0, 5.0, 4.0, 0.0, 2.0, 3.0], "bins": [-6.140625, -5.95965576171875, -5.7786865234375, -5.59771728515625, -5.416748046875, -5.23577880859375, -5.0548095703125, -4.87384033203125, -4.69287109375, -4.51190185546875, -4.3309326171875, -4.14996337890625, -3.968994140625, -3.78802490234375, -3.6070556640625, -3.42608642578125, -3.2451171875, -3.06414794921875, -2.8831787109375, -2.70220947265625, -2.521240234375, -2.34027099609375, -2.1593017578125, -1.97833251953125, -1.79736328125, -1.61639404296875, -1.4354248046875, -1.25445556640625, -1.073486328125, -0.89251708984375, -0.7115478515625, -0.53057861328125, -0.349609375, -0.16864013671875, 0.0123291015625, 0.19329833984375, 0.374267578125, 0.55523681640625, 0.7362060546875, 0.91717529296875, 1.09814453125, 1.27911376953125, 1.4600830078125, 1.64105224609375, 1.822021484375, 2.00299072265625, 2.1839599609375, 2.36492919921875, 2.5458984375, 2.72686767578125, 2.9078369140625, 3.08880615234375, 3.269775390625, 3.45074462890625, 3.6317138671875, 3.81268310546875, 3.99365234375, 4.17462158203125, 4.3555908203125, 4.53656005859375, 4.717529296875, 4.89849853515625, 5.0794677734375, 5.26043701171875, 5.44140625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 8.0, 1.0, 9.0, 15.0, 29.0, 18.0, 33.0, 35.0, 51.0, 46.0, 77.0, 103.0, 119.0, 205.0, 296.0, 521.0, 1034.0, 2300.0, 5614.0, 15362.0, 47294.0, 154109.0, 480399.0, 234969.0, 69281.0, 22597.0, 7839.0, 2988.0, 1340.0, 658.0, 341.0, 228.0, 155.0, 114.0, 76.0, 51.0, 46.0, 35.0, 50.0, 17.0, 23.0, 19.0, 9.0, 9.0, 3.0, 6.0, 6.0, 3.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0], "bins": [-6.5, -6.301025390625, -6.10205078125, -5.903076171875, -5.7041015625, -5.505126953125, -5.30615234375, -5.107177734375, -4.908203125, -4.709228515625, -4.51025390625, -4.311279296875, -4.1123046875, -3.913330078125, -3.71435546875, -3.515380859375, -3.31640625, -3.117431640625, -2.91845703125, -2.719482421875, -2.5205078125, -2.321533203125, -2.12255859375, -1.923583984375, -1.724609375, -1.525634765625, -1.32666015625, -1.127685546875, -0.9287109375, -0.729736328125, -0.53076171875, -0.331787109375, -0.1328125, 0.066162109375, 0.26513671875, 0.464111328125, 0.6630859375, 0.862060546875, 1.06103515625, 1.260009765625, 1.458984375, 1.657958984375, 1.85693359375, 2.055908203125, 2.2548828125, 2.453857421875, 2.65283203125, 2.851806640625, 3.05078125, 3.249755859375, 3.44873046875, 3.647705078125, 3.8466796875, 4.045654296875, 4.24462890625, 4.443603515625, 4.642578125, 4.841552734375, 5.04052734375, 5.239501953125, 5.4384765625, 5.637451171875, 5.83642578125, 6.035400390625, 6.234375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 6.0, 4.0, 4.0, 14.0, 11.0, 11.0, 13.0, 17.0, 21.0, 30.0, 33.0, 41.0, 45.0, 43.0, 36.0, 62.0, 80.0, 271.0, 1677.0, 165.0, 72.0, 50.0, 49.0, 56.0, 38.0, 36.0, 29.0, 31.0, 25.0, 17.0, 9.0, 12.0, 13.0, 6.0, 4.0, 11.0, 1.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-24.75, -24.006591796875, -23.26318359375, -22.519775390625, -21.7763671875, -21.032958984375, -20.28955078125, -19.546142578125, -18.802734375, -18.059326171875, -17.31591796875, -16.572509765625, -15.8291015625, -15.085693359375, -14.34228515625, -13.598876953125, -12.85546875, -12.112060546875, -11.36865234375, -10.625244140625, -9.8818359375, -9.138427734375, -8.39501953125, -7.651611328125, -6.908203125, -6.164794921875, -5.42138671875, -4.677978515625, -3.9345703125, -3.191162109375, -2.44775390625, -1.704345703125, -0.9609375, -0.217529296875, 0.52587890625, 1.269287109375, 2.0126953125, 2.756103515625, 3.49951171875, 4.242919921875, 4.986328125, 5.729736328125, 6.47314453125, 7.216552734375, 7.9599609375, 8.703369140625, 9.44677734375, 10.190185546875, 10.93359375, 11.677001953125, 12.42041015625, 13.163818359375, 13.9072265625, 14.650634765625, 15.39404296875, 16.137451171875, 16.880859375, 17.624267578125, 18.36767578125, 19.111083984375, 19.8544921875, 20.597900390625, 21.34130859375, 22.084716796875, 22.828125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 6.0, 8.0, 11.0, 17.0, 18.0, 18.0, 33.0, 34.0, 56.0, 71.0, 103.0, 156.0, 165.0, 312.0, 601.0, 2276.0, 2712387.0, 426337.0, 1638.0, 543.0, 289.0, 190.0, 121.0, 84.0, 49.0, 46.0, 24.0, 29.0, 18.0, 17.0, 12.0, 7.0, 4.0, 3.0, 6.0, 3.0, 1.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.0625, -65.142578125, -63.22265625, -61.302734375, -59.3828125, -57.462890625, -55.54296875, -53.623046875, -51.703125, -49.783203125, -47.86328125, -45.943359375, -44.0234375, -42.103515625, -40.18359375, -38.263671875, -36.34375, -34.423828125, -32.50390625, -30.583984375, -28.6640625, -26.744140625, -24.82421875, -22.904296875, -20.984375, -19.064453125, -17.14453125, -15.224609375, -13.3046875, -11.384765625, -9.46484375, -7.544921875, -5.625, -3.705078125, -1.78515625, 0.134765625, 2.0546875, 3.974609375, 5.89453125, 7.814453125, 9.734375, 11.654296875, 13.57421875, 15.494140625, 17.4140625, 19.333984375, 21.25390625, 23.173828125, 25.09375, 27.013671875, 28.93359375, 30.853515625, 32.7734375, 34.693359375, 36.61328125, 38.533203125, 40.453125, 42.373046875, 44.29296875, 46.212890625, 48.1328125, 50.052734375, 51.97265625, 53.892578125, 55.8125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 8.0, 962.0, 48.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.508975982666016, -27.757720947265625, -20.006465911865234, -12.255208969116211, -4.50395393371582, 3.247303009033203, 10.998558044433594, 18.749813079833984, 26.501068115234375, 34.252323150634766, 42.003578186035156, 49.75483703613281, 57.50608825683594, 65.2573471069336, 73.00860595703125, 80.75985717773438, 88.5111083984375, 96.26236724853516, 104.01361846923828, 111.76487731933594, 119.51612854003906, 127.26738739013672, 135.01864624023438, 142.7698974609375, 150.52114868164062, 158.27239990234375, 166.02366638183594, 173.77491760253906, 181.5261688232422, 189.27743530273438, 197.0286865234375, 204.77993774414062, 212.5312042236328, 220.28245544433594, 228.03372192382812, 235.78497314453125, 243.53622436523438, 251.2874755859375, 259.0387268066406, 266.78997802734375, 274.541259765625, 282.2925109863281, 290.04376220703125, 297.7950134277344, 305.5462951660156, 313.29754638671875, 321.0487976074219, 328.800048828125, 336.5513000488281, 344.30255126953125, 352.0538024902344, 359.8050537109375, 367.55633544921875, 375.3075866699219, 383.058837890625, 390.8100891113281, 398.56134033203125, 406.3125915527344, 414.0638427734375, 421.8150939941406, 429.5663757324219, 437.317626953125, 445.0688781738281, 452.82012939453125, 460.5713806152344]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 10.0, 8.0, 13.0, 11.0, 13.0, 16.0, 16.0, 20.0, 19.0, 30.0, 28.0, 27.0, 30.0, 38.0, 30.0, 46.0, 34.0, 33.0, 47.0, 39.0, 41.0, 43.0, 36.0, 34.0, 35.0, 38.0, 38.0, 35.0, 25.0, 28.0, 16.0, 25.0, 13.0, 16.0, 11.0, 14.0, 10.0, 6.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.734291076660156, -49.07063674926758, -47.406986236572266, -45.74333190917969, -44.079681396484375, -42.4160270690918, -40.75237274169922, -39.088722229003906, -37.42506790161133, -35.76141357421875, -34.09776306152344, -32.43410873413086, -30.770456314086914, -29.10680389404297, -27.443151473999023, -25.779499053955078, -24.115846633911133, -22.452194213867188, -20.788541793823242, -19.124889373779297, -17.46123504638672, -15.797582626342773, -14.133930206298828, -12.470276832580566, -10.806624412536621, -9.142971992492676, -7.479318618774414, -5.815666198730469, -4.152013301849365, -2.4883604049682617, -0.8247079849243164, 0.8389453887939453, 2.5025978088378906, 4.166250705718994, 5.829903602600098, 7.493556022644043, 9.157209396362305, 10.82086181640625, 12.484514236450195, 14.148167610168457, 15.811820030212402, 17.475473403930664, 19.13912582397461, 20.802778244018555, 22.4664306640625, 24.130084991455078, 25.79373550415039, 27.45738983154297, 29.121042251586914, 30.78469467163086, 32.44834899902344, 34.11199951171875, 35.77565383911133, 37.439308166503906, 39.10295867919922, 40.7666130065918, 42.43026351928711, 44.09391784667969, 45.757568359375, 47.42122268676758, 49.08487319946289, 50.74852752685547, 52.41217803955078, 54.07583236694336, 55.73948669433594]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 10.0, 5.0, 4.0, 6.0, 9.0, 9.0, 13.0, 9.0, 14.0, 13.0, 21.0, 26.0, 17.0, 26.0, 28.0, 36.0, 39.0, 23.0, 33.0, 43.0, 40.0, 32.0, 35.0, 30.0, 37.0, 40.0, 33.0, 36.0, 29.0, 34.0, 29.0, 34.0, 29.0, 23.0, 23.0, 20.0, 19.0, 12.0, 11.0, 20.0, 10.0, 11.0, 4.0, 4.0, 3.0, 7.0, 7.0, 3.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-6.21875, -6.02764892578125, -5.8365478515625, -5.64544677734375, -5.454345703125, -5.26324462890625, -5.0721435546875, -4.88104248046875, -4.68994140625, -4.49884033203125, -4.3077392578125, -4.11663818359375, -3.925537109375, -3.73443603515625, -3.5433349609375, -3.35223388671875, -3.1611328125, -2.97003173828125, -2.7789306640625, -2.58782958984375, -2.396728515625, -2.20562744140625, -2.0145263671875, -1.82342529296875, -1.63232421875, -1.44122314453125, -1.2501220703125, -1.05902099609375, -0.867919921875, -0.67681884765625, -0.4857177734375, -0.29461669921875, -0.103515625, 0.08758544921875, 0.2786865234375, 0.46978759765625, 0.660888671875, 0.85198974609375, 1.0430908203125, 1.23419189453125, 1.42529296875, 1.61639404296875, 1.8074951171875, 1.99859619140625, 2.189697265625, 2.38079833984375, 2.5718994140625, 2.76300048828125, 2.9541015625, 3.14520263671875, 3.3363037109375, 3.52740478515625, 3.718505859375, 3.90960693359375, 4.1007080078125, 4.29180908203125, 4.48291015625, 4.67401123046875, 4.8651123046875, 5.05621337890625, 5.247314453125, 5.43841552734375, 5.6295166015625, 5.82061767578125, 6.01171875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 5.0, 9.0, 11.0, 8.0, 5.0, 12.0, 15.0, 15.0, 22.0, 24.0, 26.0, 30.0, 33.0, 52.0, 77.0, 98.0, 135.0, 196.0, 321.0, 604.0, 1767.0, 11625.0, 316450.0, 3311879.0, 530165.0, 16674.0, 2277.0, 640.0, 311.0, 181.0, 133.0, 112.0, 60.0, 64.0, 51.0, 35.0, 34.0, 24.0, 16.0, 14.0, 14.0, 13.0, 10.0, 6.0, 3.0, 8.0, 3.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0], "bins": [-21.40625, -20.7490234375, -20.091796875, -19.4345703125, -18.77734375, -18.1201171875, -17.462890625, -16.8056640625, -16.1484375, -15.4912109375, -14.833984375, -14.1767578125, -13.51953125, -12.8623046875, -12.205078125, -11.5478515625, -10.890625, -10.2333984375, -9.576171875, -8.9189453125, -8.26171875, -7.6044921875, -6.947265625, -6.2900390625, -5.6328125, -4.9755859375, -4.318359375, -3.6611328125, -3.00390625, -2.3466796875, -1.689453125, -1.0322265625, -0.375, 0.2822265625, 0.939453125, 1.5966796875, 2.25390625, 2.9111328125, 3.568359375, 4.2255859375, 4.8828125, 5.5400390625, 6.197265625, 6.8544921875, 7.51171875, 8.1689453125, 8.826171875, 9.4833984375, 10.140625, 10.7978515625, 11.455078125, 12.1123046875, 12.76953125, 13.4267578125, 14.083984375, 14.7412109375, 15.3984375, 16.0556640625, 16.712890625, 17.3701171875, 18.02734375, 18.6845703125, 19.341796875, 19.9990234375, 20.65625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 8.0, 14.0, 23.0, 44.0, 50.0, 80.0, 123.0, 175.0, 269.0, 420.0, 572.0, 649.0, 580.0, 376.0, 227.0, 171.0, 95.0, 56.0, 45.0, 20.0, 19.0, 19.0, 11.0, 8.0, 5.0, 7.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-22.53125, -21.9990234375, -21.466796875, -20.9345703125, -20.40234375, -19.8701171875, -19.337890625, -18.8056640625, -18.2734375, -17.7412109375, -17.208984375, -16.6767578125, -16.14453125, -15.6123046875, -15.080078125, -14.5478515625, -14.015625, -13.4833984375, -12.951171875, -12.4189453125, -11.88671875, -11.3544921875, -10.822265625, -10.2900390625, -9.7578125, -9.2255859375, -8.693359375, -8.1611328125, -7.62890625, -7.0966796875, -6.564453125, -6.0322265625, -5.5, -4.9677734375, -4.435546875, -3.9033203125, -3.37109375, -2.8388671875, -2.306640625, -1.7744140625, -1.2421875, -0.7099609375, -0.177734375, 0.3544921875, 0.88671875, 1.4189453125, 1.951171875, 2.4833984375, 3.015625, 3.5478515625, 4.080078125, 4.6123046875, 5.14453125, 5.6767578125, 6.208984375, 6.7412109375, 7.2734375, 7.8056640625, 8.337890625, 8.8701171875, 9.40234375, 9.9345703125, 10.466796875, 10.9990234375, 11.53125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 3.0, 5.0, 7.0, 10.0, 15.0, 25.0, 28.0, 29.0, 56.0, 81.0, 110.0, 203.0, 253.0, 373.0, 704.0, 5018.0, 4130709.0, 54291.0, 972.0, 438.0, 284.0, 195.0, 164.0, 94.0, 82.0, 48.0, 42.0, 21.0, 13.0, 9.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.9375, -57.0390625, -54.140625, -51.2421875, -48.34375, -45.4453125, -42.546875, -39.6484375, -36.75, -33.8515625, -30.953125, -28.0546875, -25.15625, -22.2578125, -19.359375, -16.4609375, -13.5625, -10.6640625, -7.765625, -4.8671875, -1.96875, 0.9296875, 3.828125, 6.7265625, 9.625, 12.5234375, 15.421875, 18.3203125, 21.21875, 24.1171875, 27.015625, 29.9140625, 32.8125, 35.7109375, 38.609375, 41.5078125, 44.40625, 47.3046875, 50.203125, 53.1015625, 56.0, 58.8984375, 61.796875, 64.6953125, 67.59375, 70.4921875, 73.390625, 76.2890625, 79.1875, 82.0859375, 84.984375, 87.8828125, 90.78125, 93.6796875, 96.578125, 99.4765625, 102.375, 105.2734375, 108.171875, 111.0703125, 113.96875, 116.8671875, 119.765625, 122.6640625, 125.5625]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 5.0, 45.0, 149.0, 403.0, 319.0, 85.0, 11.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.12209129333496, -19.851913452148438, -14.581737518310547, -9.31156063079834, -4.041383743286133, 1.2287921905517578, 6.498970031738281, 11.769147872924805, 17.039323806762695, 22.30950164794922, 27.57967758178711, 32.849853515625, 38.120033264160156, 43.39020538330078, 48.66038513183594, 53.930564880371094, 59.20073699951172, 64.47091674804688, 69.7410888671875, 75.01126861572266, 80.28144836425781, 85.55162048339844, 90.8218002319336, 96.09197998046875, 101.36215209960938, 106.63233184814453, 111.90250396728516, 117.17268371582031, 122.44285583496094, 127.7130355834961, 132.98321533203125, 138.25338745117188, 143.5235595703125, 148.79373168945312, 154.0639190673828, 159.33409118652344, 164.60426330566406, 169.87445068359375, 175.14462280273438, 180.414794921875, 185.68496704101562, 190.95513916015625, 196.22532653808594, 201.49549865722656, 206.7656707763672, 212.03585815429688, 217.3060302734375, 222.57620239257812, 227.8463897705078, 233.11656188964844, 238.38674926757812, 243.65692138671875, 248.92709350585938, 254.197265625, 259.4674377441406, 264.7376403808594, 270.0078125, 275.2779846191406, 280.54815673828125, 285.8183288574219, 291.0885314941406, 296.35870361328125, 301.6288757324219, 306.8990478515625, 312.1692199707031]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 0.0, 4.0, 6.0, 4.0, 6.0, 12.0, 14.0, 13.0, 15.0, 28.0, 25.0, 28.0, 34.0, 35.0, 34.0, 43.0, 42.0, 60.0, 49.0, 50.0, 53.0, 55.0, 40.0, 36.0, 42.0, 38.0, 29.0, 38.0, 41.0, 20.0, 19.0, 18.0, 21.0, 13.0, 16.0, 7.0, 7.0, 4.0, 3.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.19474792480469, -44.745391845703125, -43.29603576660156, -41.8466796875, -40.39732360839844, -38.947967529296875, -37.49861145019531, -36.04925537109375, -34.59989929199219, -33.150543212890625, -31.701187133789062, -30.2518310546875, -28.802474975585938, -27.353118896484375, -25.903762817382812, -24.45440673828125, -23.005050659179688, -21.555694580078125, -20.106338500976562, -18.656982421875, -17.207626342773438, -15.758270263671875, -14.308914184570312, -12.85955810546875, -11.410202026367188, -9.960845947265625, -8.511489868164062, -7.0621337890625, -5.6127777099609375, -4.163421630859375, -2.7140655517578125, -1.26470947265625, 0.1846466064453125, 1.634002685546875, 3.0833587646484375, 4.53271484375, 5.9820709228515625, 7.431427001953125, 8.880783081054688, 10.33013916015625, 11.779495239257812, 13.228851318359375, 14.678207397460938, 16.1275634765625, 17.576919555664062, 19.026275634765625, 20.475631713867188, 21.92498779296875, 23.374343872070312, 24.823699951171875, 26.273056030273438, 27.722412109375, 29.171768188476562, 30.621124267578125, 32.07048034667969, 33.51983642578125, 34.96919250488281, 36.418548583984375, 37.86790466308594, 39.3172607421875, 40.76661682128906, 42.215972900390625, 43.66532897949219, 45.11468505859375, 46.56404113769531]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 5.0, 8.0, 3.0, 15.0, 10.0, 21.0, 21.0, 20.0, 21.0, 23.0, 19.0, 31.0, 30.0, 26.0, 35.0, 37.0, 33.0, 24.0, 36.0, 48.0, 33.0, 33.0, 34.0, 28.0, 41.0, 31.0, 39.0, 34.0, 26.0, 28.0, 25.0, 21.0, 24.0, 17.0, 12.0, 15.0, 15.0, 13.0, 6.0, 4.0, 12.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.81640625, -5.62738037109375, -5.4383544921875, -5.24932861328125, -5.060302734375, -4.87127685546875, -4.6822509765625, -4.49322509765625, -4.30419921875, -4.11517333984375, -3.9261474609375, -3.73712158203125, -3.548095703125, -3.35906982421875, -3.1700439453125, -2.98101806640625, -2.7919921875, -2.60296630859375, -2.4139404296875, -2.22491455078125, -2.035888671875, -1.84686279296875, -1.6578369140625, -1.46881103515625, -1.27978515625, -1.09075927734375, -0.9017333984375, -0.71270751953125, -0.523681640625, -0.33465576171875, -0.1456298828125, 0.04339599609375, 0.232421875, 0.42144775390625, 0.6104736328125, 0.79949951171875, 0.988525390625, 1.17755126953125, 1.3665771484375, 1.55560302734375, 1.74462890625, 1.93365478515625, 2.1226806640625, 2.31170654296875, 2.500732421875, 2.68975830078125, 2.8787841796875, 3.06781005859375, 3.2568359375, 3.44586181640625, 3.6348876953125, 3.82391357421875, 4.012939453125, 4.20196533203125, 4.3909912109375, 4.58001708984375, 4.76904296875, 4.95806884765625, 5.1470947265625, 5.33612060546875, 5.525146484375, 5.71417236328125, 5.9031982421875, 6.09222412109375, 6.28125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [8.0, 6.0, 12.0, 18.0, 18.0, 51.0, 52.0, 81.0, 94.0, 124.0, 160.0, 261.0, 337.0, 459.0, 624.0, 777.0, 1150.0, 1613.0, 2260.0, 2923.0, 4309.0, 5915.0, 7992.0, 11487.0, 16465.0, 23618.0, 34413.0, 51594.0, 80071.0, 135137.0, 252932.0, 150511.0, 85624.0, 55144.0, 36882.0, 25039.0, 17534.0, 12219.0, 8418.0, 6199.0, 4453.0, 3065.0, 2202.0, 1756.0, 1217.0, 845.0, 646.0, 475.0, 405.0, 268.0, 209.0, 130.0, 108.0, 80.0, 64.0, 32.0, 35.0, 28.0, 13.0, 8.0, 1.0, 2.0, 2.0, 1.0], "bins": [-1.0087890625, -0.975799560546875, -0.94281005859375, -0.909820556640625, -0.8768310546875, -0.843841552734375, -0.81085205078125, -0.777862548828125, -0.744873046875, -0.711883544921875, -0.67889404296875, -0.645904541015625, -0.6129150390625, -0.579925537109375, -0.54693603515625, -0.513946533203125, -0.48095703125, -0.447967529296875, -0.41497802734375, -0.381988525390625, -0.3489990234375, -0.316009521484375, -0.28302001953125, -0.250030517578125, -0.217041015625, -0.184051513671875, -0.15106201171875, -0.118072509765625, -0.0850830078125, -0.052093505859375, -0.01910400390625, 0.013885498046875, 0.046875, 0.079864501953125, 0.11285400390625, 0.145843505859375, 0.1788330078125, 0.211822509765625, 0.24481201171875, 0.277801513671875, 0.310791015625, 0.343780517578125, 0.37677001953125, 0.409759521484375, 0.4427490234375, 0.475738525390625, 0.50872802734375, 0.541717529296875, 0.57470703125, 0.607696533203125, 0.64068603515625, 0.673675537109375, 0.7066650390625, 0.739654541015625, 0.77264404296875, 0.805633544921875, 0.838623046875, 0.871612548828125, 0.90460205078125, 0.937591552734375, 0.9705810546875, 1.003570556640625, 1.03656005859375, 1.069549560546875, 1.1025390625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 4.0, 4.0, 10.0, 18.0, 8.0, 11.0, 11.0, 20.0, 21.0, 19.0, 31.0, 20.0, 21.0, 24.0, 35.0, 29.0, 42.0, 33.0, 37.0, 42.0, 31.0, 1064.0, 43.0, 27.0, 32.0, 36.0, 31.0, 35.0, 41.0, 28.0, 24.0, 26.0, 23.0, 19.0, 20.0, 16.0, 15.0, 10.0, 17.0, 8.0, 12.0, 7.0, 4.0, 6.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.66015625, -3.5338134765625, -3.407470703125, -3.2811279296875, -3.15478515625, -3.0284423828125, -2.902099609375, -2.7757568359375, -2.6494140625, -2.5230712890625, -2.396728515625, -2.2703857421875, -2.14404296875, -2.0177001953125, -1.891357421875, -1.7650146484375, -1.638671875, -1.5123291015625, -1.385986328125, -1.2596435546875, -1.13330078125, -1.0069580078125, -0.880615234375, -0.7542724609375, -0.6279296875, -0.5015869140625, -0.375244140625, -0.2489013671875, -0.12255859375, 0.0037841796875, 0.130126953125, 0.2564697265625, 0.3828125, 0.5091552734375, 0.635498046875, 0.7618408203125, 0.88818359375, 1.0145263671875, 1.140869140625, 1.2672119140625, 1.3935546875, 1.5198974609375, 1.646240234375, 1.7725830078125, 1.89892578125, 2.0252685546875, 2.151611328125, 2.2779541015625, 2.404296875, 2.5306396484375, 2.656982421875, 2.7833251953125, 2.90966796875, 3.0360107421875, 3.162353515625, 3.2886962890625, 3.4150390625, 3.5413818359375, 3.667724609375, 3.7940673828125, 3.92041015625, 4.0467529296875, 4.173095703125, 4.2994384765625, 4.42578125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 4.0, 6.0, 6.0, 13.0, 15.0, 17.0, 16.0, 31.0, 49.0, 82.0, 175.0, 295.0, 574.0, 1079.0, 1998.0, 3590.0, 6803.0, 12624.0, 23633.0, 45250.0, 93384.0, 249717.0, 1419047.0, 120649.0, 56043.0, 28895.0, 15345.0, 8162.0, 4385.0, 2387.0, 1269.0, 683.0, 395.0, 193.0, 115.0, 52.0, 44.0, 32.0, 11.0, 11.0, 15.0, 11.0, 8.0, 3.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.080078125, -2.0191802978515625, -1.958282470703125, -1.8973846435546875, -1.83648681640625, -1.7755889892578125, -1.714691162109375, -1.6537933349609375, -1.5928955078125, -1.5319976806640625, -1.471099853515625, -1.4102020263671875, -1.34930419921875, -1.2884063720703125, -1.227508544921875, -1.1666107177734375, -1.105712890625, -1.0448150634765625, -0.983917236328125, -0.9230194091796875, -0.86212158203125, -0.8012237548828125, -0.740325927734375, -0.6794281005859375, -0.6185302734375, -0.5576324462890625, -0.496734619140625, -0.4358367919921875, -0.37493896484375, -0.3140411376953125, -0.253143310546875, -0.1922454833984375, -0.13134765625, -0.0704498291015625, -0.009552001953125, 0.0513458251953125, 0.11224365234375, 0.1731414794921875, 0.234039306640625, 0.2949371337890625, 0.3558349609375, 0.4167327880859375, 0.477630615234375, 0.5385284423828125, 0.59942626953125, 0.6603240966796875, 0.721221923828125, 0.7821197509765625, 0.843017578125, 0.9039154052734375, 0.964813232421875, 1.0257110595703125, 1.08660888671875, 1.1475067138671875, 1.208404541015625, 1.2693023681640625, 1.3302001953125, 1.3910980224609375, 1.451995849609375, 1.5128936767578125, 1.57379150390625, 1.6346893310546875, 1.695587158203125, 1.7564849853515625, 1.8173828125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 4.0, 4.0, 14.0, 5.0, 9.0, 9.0, 13.0, 17.0, 18.0, 20.0, 20.0, 32.0, 33.0, 47.0, 55.0, 51.0, 59.0, 76.0, 65.0, 63.0, 68.0, 37.0, 36.0, 53.0, 38.0, 25.0, 19.0, 16.0, 14.0, 17.0, 10.0, 13.0, 9.0, 9.0, 7.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007963180541992188, -0.00077095627784729, -0.0007455945014953613, -0.0007202327251434326, -0.0006948709487915039, -0.0006695091724395752, -0.0006441473960876465, -0.0006187856197357178, -0.0005934238433837891, -0.0005680620670318604, -0.0005427002906799316, -0.0005173385143280029, -0.0004919767379760742, -0.0004666149616241455, -0.0004412531852722168, -0.0004158914089202881, -0.0003905296325683594, -0.00036516785621643066, -0.00033980607986450195, -0.00031444430351257324, -0.00028908252716064453, -0.0002637207508087158, -0.0002383589744567871, -0.0002129971981048584, -0.0001876354217529297, -0.00016227364540100098, -0.00013691186904907227, -0.00011155009269714355, -8.618831634521484e-05, -6.082653999328613e-05, -3.546476364135742e-05, -1.0102987289428711e-05, 1.52587890625e-05, 4.062056541442871e-05, 6.598234176635742e-05, 9.134411811828613e-05, 0.00011670589447021484, 0.00014206767082214355, 0.00016742944717407227, 0.00019279122352600098, 0.0002181529998779297, 0.0002435147762298584, 0.0002688765525817871, 0.0002942383289337158, 0.00031960010528564453, 0.00034496188163757324, 0.00037032365798950195, 0.00039568543434143066, 0.0004210472106933594, 0.0004464089870452881, 0.0004717707633972168, 0.0004971325397491455, 0.0005224943161010742, 0.0005478560924530029, 0.0005732178688049316, 0.0005985796451568604, 0.0006239414215087891, 0.0006493031978607178, 0.0006746649742126465, 0.0007000267505645752, 0.0007253885269165039, 0.0007507503032684326, 0.0007761120796203613, 0.00080147385597229, 0.0008268356323242188]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 7.0, 5.0, 9.0, 7.0, 13.0, 16.0, 17.0, 18.0, 21.0, 32.0, 32.0, 55.0, 66.0, 102.0, 121.0, 244.0, 638.0, 6659.0, 1029628.0, 9308.0, 669.0, 272.0, 159.0, 116.0, 68.0, 64.0, 27.0, 32.0, 24.0, 20.0, 20.0, 17.0, 11.0, 5.0, 10.0, 7.0, 6.0, 8.0, 8.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0182037353515625, -0.017644166946411133, -0.017084598541259766, -0.0165250301361084, -0.01596546173095703, -0.015405893325805664, -0.014846324920654297, -0.01428675651550293, -0.013727188110351562, -0.013167619705200195, -0.012608051300048828, -0.012048482894897461, -0.011488914489746094, -0.010929346084594727, -0.01036977767944336, -0.009810209274291992, -0.009250640869140625, -0.008691072463989258, -0.00813150405883789, -0.0075719356536865234, -0.007012367248535156, -0.006452798843383789, -0.005893230438232422, -0.005333662033081055, -0.0047740936279296875, -0.00421452522277832, -0.003654956817626953, -0.003095388412475586, -0.0025358200073242188, -0.0019762516021728516, -0.0014166831970214844, -0.0008571147918701172, -0.00029754638671875, 0.0002620220184326172, 0.0008215904235839844, 0.0013811588287353516, 0.0019407272338867188, 0.002500295639038086, 0.003059864044189453, 0.0036194324493408203, 0.0041790008544921875, 0.004738569259643555, 0.005298137664794922, 0.005857706069946289, 0.006417274475097656, 0.0069768428802490234, 0.007536411285400391, 0.008095979690551758, 0.008655548095703125, 0.009215116500854492, 0.00977468490600586, 0.010334253311157227, 0.010893821716308594, 0.011453390121459961, 0.012012958526611328, 0.012572526931762695, 0.013132095336914062, 0.01369166374206543, 0.014251232147216797, 0.014810800552368164, 0.015370368957519531, 0.0159299373626709, 0.016489505767822266, 0.017049074172973633, 0.017608642578125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 8.0, 106.0, 418.0, 396.0, 82.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.003527667373418808, -0.0034570051357150078, -0.003386342665180564, -0.00331568019464612, -0.00324501795694232, -0.0031743557192385197, -0.003103693248704076, -0.003033030778169632, -0.0029623685404658318, -0.0028917063027620316, -0.0028210438322275877, -0.002750381361693144, -0.0026797191239893436, -0.0026090568862855434, -0.0025383944157510996, -0.0024677319452166557, -0.0023970697075128555, -0.0023264074698090553, -0.0022557449992746115, -0.0021850825287401676, -0.0021144202910363674, -0.002043758053332567, -0.0019730955827981234, -0.0019024332286790013, -0.0018317708745598793, -0.0017611085204407573, -0.0016904461663216352, -0.0016197838122025132, -0.0015491214580833912, -0.0014784591039642692, -0.0014077967498451471, -0.001337134395726025, -0.0012664722744375467, -0.0011958099203184247, -0.0011251475661993027, -0.0010544852120801806, -0.0009838228579610586, -0.0009131605038419366, -0.0008424981497228146, -0.0007718357956036925, -0.0007011734414845705, -0.0006305110873654485, -0.0005598487332463264, -0.0004891863791272044, -0.0004185240250080824, -0.00034786167088896036, -0.00027719931676983833, -0.0002065369626507163, -0.00013587460853159428, -6.521225441247225e-05, 5.45009970664978e-06, 7.611245382577181e-05, 0.00014677480794489384, 0.00021743716206401587, 0.0002880995161831379, 0.0003587618703022599, 0.00042942422442138195, 0.000500086578540504, 0.000570748932659626, 0.000641411286778748, 0.0007120736408978701, 0.0007827359950169921, 0.0008533983491361141, 0.0009240607032552361, 0.0009947230573743582]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 8.0, 1.0, 12.0, 6.0, 8.0, 18.0, 17.0, 10.0, 21.0, 16.0, 13.0, 27.0, 29.0, 27.0, 38.0, 44.0, 29.0, 29.0, 50.0, 42.0, 29.0, 38.0, 35.0, 47.0, 31.0, 38.0, 29.0, 33.0, 40.0, 38.0, 25.0, 26.0, 19.0, 24.0, 16.0, 14.0, 13.0, 11.0, 5.0, 6.0, 8.0, 9.0, 5.0, 5.0, 4.0, 1.0, 1.0, 7.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00041228532791137695, -0.00039972737431526184, -0.00038716942071914673, -0.0003746114671230316, -0.0003620535135269165, -0.0003494955599308014, -0.0003369376063346863, -0.00032437965273857117, -0.00031182169914245605, -0.00029926374554634094, -0.00028670579195022583, -0.0002741478383541107, -0.0002615898847579956, -0.0002490319311618805, -0.00023647397756576538, -0.00022391602396965027, -0.00021135807037353516, -0.00019880011677742004, -0.00018624216318130493, -0.00017368420958518982, -0.0001611262559890747, -0.0001485683023929596, -0.00013601034879684448, -0.00012345239520072937, -0.00011089444160461426, -9.833648800849915e-05, -8.577853441238403e-05, -7.322058081626892e-05, -6.066262722015381e-05, -4.8104673624038696e-05, -3.5546720027923584e-05, -2.298876643180847e-05, -1.043081283569336e-05, 2.127140760421753e-06, 1.4685094356536865e-05, 2.7243047952651978e-05, 3.980100154876709e-05, 5.23589551448822e-05, 6.491690874099731e-05, 7.747486233711243e-05, 9.003281593322754e-05, 0.00010259076952934265, 0.00011514872312545776, 0.00012770667672157288, 0.000140264630317688, 0.0001528225839138031, 0.0001653805375099182, 0.00017793849110603333, 0.00019049644470214844, 0.00020305439829826355, 0.00021561235189437866, 0.00022817030549049377, 0.0002407282590866089, 0.000253286212682724, 0.0002658441662788391, 0.0002784021198749542, 0.00029096007347106934, 0.00030351802706718445, 0.00031607598066329956, 0.00032863393425941467, 0.0003411918878555298, 0.0003537498414516449, 0.00036630779504776, 0.0003788657486438751, 0.00039142370223999023]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 5.0, 8.0, 3.0, 15.0, 10.0, 21.0, 21.0, 20.0, 21.0, 23.0, 19.0, 31.0, 30.0, 26.0, 35.0, 37.0, 33.0, 24.0, 36.0, 48.0, 33.0, 33.0, 34.0, 28.0, 41.0, 31.0, 39.0, 34.0, 26.0, 28.0, 25.0, 21.0, 24.0, 17.0, 12.0, 15.0, 15.0, 13.0, 6.0, 4.0, 12.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.81640625, -5.62738037109375, -5.4383544921875, -5.24932861328125, -5.060302734375, -4.87127685546875, -4.6822509765625, -4.49322509765625, -4.30419921875, -4.11517333984375, -3.9261474609375, -3.73712158203125, -3.548095703125, -3.35906982421875, -3.1700439453125, -2.98101806640625, -2.7919921875, -2.60296630859375, -2.4139404296875, -2.22491455078125, -2.035888671875, -1.84686279296875, -1.6578369140625, -1.46881103515625, -1.27978515625, -1.09075927734375, -0.9017333984375, -0.71270751953125, -0.523681640625, -0.33465576171875, -0.1456298828125, 0.04339599609375, 0.232421875, 0.42144775390625, 0.6104736328125, 0.79949951171875, 0.988525390625, 1.17755126953125, 1.3665771484375, 1.55560302734375, 1.74462890625, 1.93365478515625, 2.1226806640625, 2.31170654296875, 2.500732421875, 2.68975830078125, 2.8787841796875, 3.06781005859375, 3.2568359375, 3.44586181640625, 3.6348876953125, 3.82391357421875, 4.012939453125, 4.20196533203125, 4.3909912109375, 4.58001708984375, 4.76904296875, 4.95806884765625, 5.1470947265625, 5.33612060546875, 5.525146484375, 5.71417236328125, 5.9031982421875, 6.09222412109375, 6.28125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 3.0, 9.0, 7.0, 17.0, 15.0, 20.0, 22.0, 29.0, 40.0, 48.0, 62.0, 66.0, 106.0, 142.0, 199.0, 243.0, 382.0, 624.0, 1340.0, 4840.0, 26701.0, 186148.0, 692156.0, 112035.0, 16976.0, 3326.0, 1109.0, 582.0, 357.0, 254.0, 161.0, 120.0, 90.0, 64.0, 55.0, 38.0, 31.0, 28.0, 16.0, 13.0, 18.0, 13.0, 18.0, 3.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 4.0, 3.0, 3.0, 0.0, 1.0], "bins": [-11.015625, -10.66455078125, -10.3134765625, -9.96240234375, -9.611328125, -9.26025390625, -8.9091796875, -8.55810546875, -8.20703125, -7.85595703125, -7.5048828125, -7.15380859375, -6.802734375, -6.45166015625, -6.1005859375, -5.74951171875, -5.3984375, -5.04736328125, -4.6962890625, -4.34521484375, -3.994140625, -3.64306640625, -3.2919921875, -2.94091796875, -2.58984375, -2.23876953125, -1.8876953125, -1.53662109375, -1.185546875, -0.83447265625, -0.4833984375, -0.13232421875, 0.21875, 0.56982421875, 0.9208984375, 1.27197265625, 1.623046875, 1.97412109375, 2.3251953125, 2.67626953125, 3.02734375, 3.37841796875, 3.7294921875, 4.08056640625, 4.431640625, 4.78271484375, 5.1337890625, 5.48486328125, 5.8359375, 6.18701171875, 6.5380859375, 6.88916015625, 7.240234375, 7.59130859375, 7.9423828125, 8.29345703125, 8.64453125, 8.99560546875, 9.3466796875, 9.69775390625, 10.048828125, 10.39990234375, 10.7509765625, 11.10205078125, 11.453125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 4.0, 8.0, 4.0, 6.0, 8.0, 13.0, 6.0, 12.0, 16.0, 16.0, 16.0, 23.0, 33.0, 42.0, 43.0, 49.0, 62.0, 63.0, 117.0, 387.0, 1553.0, 154.0, 75.0, 50.0, 42.0, 42.0, 34.0, 32.0, 22.0, 26.0, 18.0, 16.0, 12.0, 8.0, 7.0, 3.0, 5.0, 2.0, 6.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.09375, -23.34326171875, -22.5927734375, -21.84228515625, -21.091796875, -20.34130859375, -19.5908203125, -18.84033203125, -18.08984375, -17.33935546875, -16.5888671875, -15.83837890625, -15.087890625, -14.33740234375, -13.5869140625, -12.83642578125, -12.0859375, -11.33544921875, -10.5849609375, -9.83447265625, -9.083984375, -8.33349609375, -7.5830078125, -6.83251953125, -6.08203125, -5.33154296875, -4.5810546875, -3.83056640625, -3.080078125, -2.32958984375, -1.5791015625, -0.82861328125, -0.078125, 0.67236328125, 1.4228515625, 2.17333984375, 2.923828125, 3.67431640625, 4.4248046875, 5.17529296875, 5.92578125, 6.67626953125, 7.4267578125, 8.17724609375, 8.927734375, 9.67822265625, 10.4287109375, 11.17919921875, 11.9296875, 12.68017578125, 13.4306640625, 14.18115234375, 14.931640625, 15.68212890625, 16.4326171875, 17.18310546875, 17.93359375, 18.68408203125, 19.4345703125, 20.18505859375, 20.935546875, 21.68603515625, 22.4365234375, 23.18701171875, 23.9375]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 7.0, 2.0, 5.0, 5.0, 8.0, 10.0, 12.0, 13.0, 24.0, 34.0, 31.0, 47.0, 59.0, 80.0, 127.0, 240.0, 489.0, 2072.0, 2468391.0, 671154.0, 1699.0, 455.0, 245.0, 125.0, 91.0, 64.0, 44.0, 34.0, 19.0, 26.0, 17.0, 13.0, 7.0, 8.0, 13.0, 7.0, 4.0, 8.0, 3.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.0, -69.7470703125, -67.494140625, -65.2412109375, -62.98828125, -60.7353515625, -58.482421875, -56.2294921875, -53.9765625, -51.7236328125, -49.470703125, -47.2177734375, -44.96484375, -42.7119140625, -40.458984375, -38.2060546875, -35.953125, -33.7001953125, -31.447265625, -29.1943359375, -26.94140625, -24.6884765625, -22.435546875, -20.1826171875, -17.9296875, -15.6767578125, -13.423828125, -11.1708984375, -8.91796875, -6.6650390625, -4.412109375, -2.1591796875, 0.09375, 2.3466796875, 4.599609375, 6.8525390625, 9.10546875, 11.3583984375, 13.611328125, 15.8642578125, 18.1171875, 20.3701171875, 22.623046875, 24.8759765625, 27.12890625, 29.3818359375, 31.634765625, 33.8876953125, 36.140625, 38.3935546875, 40.646484375, 42.8994140625, 45.15234375, 47.4052734375, 49.658203125, 51.9111328125, 54.1640625, 56.4169921875, 58.669921875, 60.9228515625, 63.17578125, 65.4287109375, 67.681640625, 69.9345703125, 72.1875]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 39.0, 624.0, 347.0, 8.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.81189727783203, -30.363893508911133, -25.915889739990234, -21.467884063720703, -17.019880294799805, -12.571876525878906, -8.123870849609375, -3.6758670806884766, 0.7721366882324219, 5.2201409339904785, 9.668145179748535, 14.11614990234375, 18.56415367126465, 23.012157440185547, 27.460163116455078, 31.908166885375977, 36.356170654296875, 40.804176330566406, 45.25217819213867, 49.7001838684082, 54.14818572998047, 58.59619140625, 63.04419708251953, 67.49220275878906, 71.94020080566406, 76.3882064819336, 80.83621215820312, 85.28421020507812, 89.73221588134766, 94.18022155761719, 98.62822723388672, 103.07623291015625, 107.52424621582031, 111.97225189208984, 116.42025756835938, 120.86825561523438, 125.3162612915039, 129.76426696777344, 134.2122802734375, 138.6602783203125, 143.1082763671875, 147.5562744140625, 152.00428771972656, 156.45228576660156, 160.90029907226562, 165.34829711914062, 169.79629516601562, 174.2443084716797, 178.69232177734375, 183.14031982421875, 187.5883331298828, 192.0363311767578, 196.48434448242188, 200.93234252929688, 205.38034057617188, 209.82835388183594, 214.27635192871094, 218.72434997558594, 223.17236328125, 227.620361328125, 232.06837463378906, 236.51637268066406, 240.96438598632812, 245.41238403320312, 249.86038208007812]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 1.0, 2.0, 7.0, 5.0, 9.0, 12.0, 18.0, 11.0, 14.0, 9.0, 18.0, 18.0, 28.0, 20.0, 16.0, 31.0, 30.0, 26.0, 40.0, 38.0, 40.0, 50.0, 37.0, 38.0, 42.0, 36.0, 40.0, 41.0, 30.0, 36.0, 30.0, 30.0, 26.0, 24.0, 25.0, 15.0, 20.0, 19.0, 14.0, 10.0, 8.0, 7.0, 9.0, 7.0, 5.0, 4.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-67.60147094726562, -65.7191390991211, -63.836814880371094, -61.95448684692383, -60.07215881347656, -58.1898307800293, -56.30750274658203, -54.4251708984375, -52.5428466796875, -50.660518646240234, -48.77819061279297, -46.8958625793457, -45.01353454589844, -43.13120651245117, -41.248878479003906, -39.366546630859375, -37.48421859741211, -35.601890563964844, -33.71956253051758, -31.837234497070312, -29.954906463623047, -28.07257843017578, -26.190248489379883, -24.307920455932617, -22.42559242248535, -20.543264389038086, -18.66093635559082, -16.778606414794922, -14.896279335021973, -13.013951301574707, -11.131622314453125, -9.24929428100586, -7.366970062255859, -5.484642028808594, -3.60231351852417, -1.719985008239746, 0.16234302520751953, 2.044671058654785, 3.927000045776367, 5.809328079223633, 7.691656112670898, 9.573984146118164, 11.45631217956543, 13.338641166687012, 15.220969200134277, 17.10329818725586, 18.985626220703125, 20.86795425415039, 22.750282287597656, 24.632610321044922, 26.514938354492188, 28.397266387939453, 30.27959442138672, 32.161922454833984, 34.04425048828125, 35.92658233642578, 37.80890655517578, 39.69123458862305, 41.57356262207031, 43.45589065551758, 45.338218688964844, 47.22054672241211, 49.102874755859375, 50.985206604003906, 52.86753463745117]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 6.0, 11.0, 6.0, 11.0, 10.0, 15.0, 24.0, 25.0, 16.0, 24.0, 26.0, 33.0, 23.0, 32.0, 28.0, 41.0, 33.0, 43.0, 29.0, 31.0, 39.0, 41.0, 41.0, 33.0, 37.0, 36.0, 31.0, 31.0, 23.0, 36.0, 23.0, 17.0, 24.0, 15.0, 13.0, 18.0, 8.0, 11.0, 5.0, 8.0, 6.0, 7.0, 11.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0], "bins": [-6.4140625, -6.21051025390625, -6.0069580078125, -5.80340576171875, -5.599853515625, -5.39630126953125, -5.1927490234375, -4.98919677734375, -4.78564453125, -4.58209228515625, -4.3785400390625, -4.17498779296875, -3.971435546875, -3.76788330078125, -3.5643310546875, -3.36077880859375, -3.1572265625, -2.95367431640625, -2.7501220703125, -2.54656982421875, -2.343017578125, -2.13946533203125, -1.9359130859375, -1.73236083984375, -1.52880859375, -1.32525634765625, -1.1217041015625, -0.91815185546875, -0.714599609375, -0.51104736328125, -0.3074951171875, -0.10394287109375, 0.099609375, 0.30316162109375, 0.5067138671875, 0.71026611328125, 0.913818359375, 1.11737060546875, 1.3209228515625, 1.52447509765625, 1.72802734375, 1.93157958984375, 2.1351318359375, 2.33868408203125, 2.542236328125, 2.74578857421875, 2.9493408203125, 3.15289306640625, 3.3564453125, 3.55999755859375, 3.7635498046875, 3.96710205078125, 4.170654296875, 4.37420654296875, 4.5777587890625, 4.78131103515625, 4.98486328125, 5.18841552734375, 5.3919677734375, 5.59552001953125, 5.799072265625, 6.00262451171875, 6.2061767578125, 6.40972900390625, 6.61328125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 2.0, 6.0, 5.0, 9.0, 7.0, 13.0, 16.0, 21.0, 34.0, 39.0, 63.0, 78.0, 98.0, 149.0, 223.0, 325.0, 551.0, 1258.0, 2993.0, 8734.0, 31189.0, 146124.0, 641982.0, 1585512.0, 1288237.0, 380293.0, 77991.0, 18018.0, 5678.0, 2162.0, 995.0, 509.0, 281.0, 187.0, 123.0, 103.0, 68.0, 42.0, 40.0, 28.0, 23.0, 22.0, 15.0, 6.0, 8.0, 8.0, 5.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-9.140625, -8.843994140625, -8.54736328125, -8.250732421875, -7.9541015625, -7.657470703125, -7.36083984375, -7.064208984375, -6.767578125, -6.470947265625, -6.17431640625, -5.877685546875, -5.5810546875, -5.284423828125, -4.98779296875, -4.691162109375, -4.39453125, -4.097900390625, -3.80126953125, -3.504638671875, -3.2080078125, -2.911376953125, -2.61474609375, -2.318115234375, -2.021484375, -1.724853515625, -1.42822265625, -1.131591796875, -0.8349609375, -0.538330078125, -0.24169921875, 0.054931640625, 0.3515625, 0.648193359375, 0.94482421875, 1.241455078125, 1.5380859375, 1.834716796875, 2.13134765625, 2.427978515625, 2.724609375, 3.021240234375, 3.31787109375, 3.614501953125, 3.9111328125, 4.207763671875, 4.50439453125, 4.801025390625, 5.09765625, 5.394287109375, 5.69091796875, 5.987548828125, 6.2841796875, 6.580810546875, 6.87744140625, 7.174072265625, 7.470703125, 7.767333984375, 8.06396484375, 8.360595703125, 8.6572265625, 8.953857421875, 9.25048828125, 9.547119140625, 9.84375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 9.0, 2.0, 5.0, 11.0, 15.0, 20.0, 27.0, 34.0, 64.0, 68.0, 77.0, 114.0, 167.0, 215.0, 253.0, 373.0, 419.0, 448.0, 424.0, 322.0, 249.0, 188.0, 131.0, 104.0, 90.0, 70.0, 40.0, 44.0, 31.0, 19.0, 16.0, 6.0, 7.0, 3.0, 4.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4453125, -11.02685546875, -10.6083984375, -10.18994140625, -9.771484375, -9.35302734375, -8.9345703125, -8.51611328125, -8.09765625, -7.67919921875, -7.2607421875, -6.84228515625, -6.423828125, -6.00537109375, -5.5869140625, -5.16845703125, -4.75, -4.33154296875, -3.9130859375, -3.49462890625, -3.076171875, -2.65771484375, -2.2392578125, -1.82080078125, -1.40234375, -0.98388671875, -0.5654296875, -0.14697265625, 0.271484375, 0.68994140625, 1.1083984375, 1.52685546875, 1.9453125, 2.36376953125, 2.7822265625, 3.20068359375, 3.619140625, 4.03759765625, 4.4560546875, 4.87451171875, 5.29296875, 5.71142578125, 6.1298828125, 6.54833984375, 6.966796875, 7.38525390625, 7.8037109375, 8.22216796875, 8.640625, 9.05908203125, 9.4775390625, 9.89599609375, 10.314453125, 10.73291015625, 11.1513671875, 11.56982421875, 11.98828125, 12.40673828125, 12.8251953125, 13.24365234375, 13.662109375, 14.08056640625, 14.4990234375, 14.91748046875, 15.3359375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 7.0, 11.0, 19.0, 11.0, 30.0, 40.0, 31.0, 60.0, 74.0, 93.0, 110.0, 132.0, 176.0, 211.0, 282.0, 426.0, 798.0, 3302.0, 130652.0, 4010761.0, 42409.0, 2288.0, 670.0, 373.0, 288.0, 199.0, 167.0, 158.0, 105.0, 81.0, 79.0, 51.0, 47.0, 38.0, 26.0, 20.0, 16.0, 8.0, 9.0, 6.0, 6.0, 5.0, 2.0, 3.0, 2.0, 1.0], "bins": [-61.1875, -59.55126953125, -57.9150390625, -56.27880859375, -54.642578125, -53.00634765625, -51.3701171875, -49.73388671875, -48.09765625, -46.46142578125, -44.8251953125, -43.18896484375, -41.552734375, -39.91650390625, -38.2802734375, -36.64404296875, -35.0078125, -33.37158203125, -31.7353515625, -30.09912109375, -28.462890625, -26.82666015625, -25.1904296875, -23.55419921875, -21.91796875, -20.28173828125, -18.6455078125, -17.00927734375, -15.373046875, -13.73681640625, -12.1005859375, -10.46435546875, -8.828125, -7.19189453125, -5.5556640625, -3.91943359375, -2.283203125, -0.64697265625, 0.9892578125, 2.62548828125, 4.26171875, 5.89794921875, 7.5341796875, 9.17041015625, 10.806640625, 12.44287109375, 14.0791015625, 15.71533203125, 17.3515625, 18.98779296875, 20.6240234375, 22.26025390625, 23.896484375, 25.53271484375, 27.1689453125, 28.80517578125, 30.44140625, 32.07763671875, 33.7138671875, 35.35009765625, 36.986328125, 38.62255859375, 40.2587890625, 41.89501953125, 43.53125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 346.0, 660.0, 13.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.63055419921875, -103.16645812988281, -88.70236206054688, -74.23826599121094, -59.774173736572266, -45.310081481933594, -30.845985412597656, -16.38188934326172, -1.9177932739257812, 12.54630184173584, 27.01039695739746, 41.474491119384766, 55.9385871887207, 70.40267944335938, 84.86677551269531, 99.33087158203125, 113.79496765136719, 128.25906372070312, 142.72315979003906, 157.187255859375, 171.65135192871094, 186.11544799804688, 200.57952880859375, 215.04364013671875, 229.50772094726562, 243.97181701660156, 258.4359130859375, 272.8999938964844, 287.3641052246094, 301.82818603515625, 316.29229736328125, 330.7563781738281, 345.2204895019531, 359.6845703125, 374.148681640625, 388.6127624511719, 403.0768737792969, 417.54095458984375, 432.00506591796875, 446.4691467285156, 460.9332580566406, 475.3973388671875, 489.8614501953125, 504.3255310058594, 518.7896118164062, 533.2537231445312, 547.7178344726562, 562.1819458007812, 576.64599609375, 591.110107421875, 605.5741577148438, 620.0382690429688, 634.5023803710938, 648.9664916992188, 663.4305419921875, 677.8946533203125, 692.3587646484375, 706.8228759765625, 721.2869262695312, 735.7510375976562, 750.2151489257812, 764.6792602539062, 779.143310546875, 793.607421875, 808.071533203125]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 11.0, 2.0, 4.0, 7.0, 15.0, 14.0, 20.0, 12.0, 16.0, 28.0, 30.0, 33.0, 33.0, 44.0, 38.0, 43.0, 35.0, 41.0, 52.0, 50.0, 38.0, 43.0, 38.0, 39.0, 34.0, 33.0, 42.0, 32.0, 30.0, 24.0, 26.0, 21.0, 12.0, 12.0, 14.0, 8.0, 9.0, 4.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0], "bins": [-61.0047607421875, -59.44115447998047, -57.87754440307617, -56.313934326171875, -54.750328063964844, -53.18672180175781, -51.623111724853516, -50.05950164794922, -48.49589538574219, -46.932289123535156, -45.36867904663086, -43.80506896972656, -42.24146270751953, -40.6778564453125, -39.1142463684082, -37.550636291503906, -35.987030029296875, -34.423423767089844, -32.85981369018555, -31.296205520629883, -29.73259735107422, -28.168989181518555, -26.60538101196289, -25.041772842407227, -23.478164672851562, -21.9145565032959, -20.350948333740234, -18.78734016418457, -17.223731994628906, -15.660123825073242, -14.096515655517578, -12.532907485961914, -10.96929931640625, -9.405691146850586, -7.842082977294922, -6.278474807739258, -4.714866638183594, -3.1512584686279297, -1.5876502990722656, -0.024042129516601562, 1.5395660400390625, 3.1031742095947266, 4.666782379150391, 6.230390548706055, 7.793998718261719, 9.357606887817383, 10.921215057373047, 12.484823226928711, 14.048431396484375, 15.612039566040039, 17.175647735595703, 18.739255905151367, 20.30286407470703, 21.866472244262695, 23.43008041381836, 24.993688583374023, 26.557296752929688, 28.12090492248535, 29.684513092041016, 31.24812126159668, 32.811729431152344, 34.375335693359375, 35.93894577026367, 37.50255584716797, 39.066162109375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 6.0, 3.0, 3.0, 1.0, 5.0, 10.0, 5.0, 8.0, 6.0, 16.0, 20.0, 16.0, 17.0, 16.0, 25.0, 15.0, 27.0, 27.0, 30.0, 28.0, 27.0, 30.0, 26.0, 39.0, 23.0, 29.0, 29.0, 27.0, 24.0, 32.0, 40.0, 30.0, 41.0, 27.0, 33.0, 22.0, 26.0, 27.0, 27.0, 15.0, 17.0, 21.0, 15.0, 16.0, 11.0, 13.0, 7.0, 12.0, 7.0, 6.0, 6.0, 2.0, 6.0, 5.0, 3.0, 4.0, 1.0, 4.0, 0.0, 3.0, 1.0], "bins": [-5.42578125, -5.24853515625, -5.0712890625, -4.89404296875, -4.716796875, -4.53955078125, -4.3623046875, -4.18505859375, -4.0078125, -3.83056640625, -3.6533203125, -3.47607421875, -3.298828125, -3.12158203125, -2.9443359375, -2.76708984375, -2.58984375, -2.41259765625, -2.2353515625, -2.05810546875, -1.880859375, -1.70361328125, -1.5263671875, -1.34912109375, -1.171875, -0.99462890625, -0.8173828125, -0.64013671875, -0.462890625, -0.28564453125, -0.1083984375, 0.06884765625, 0.24609375, 0.42333984375, 0.6005859375, 0.77783203125, 0.955078125, 1.13232421875, 1.3095703125, 1.48681640625, 1.6640625, 1.84130859375, 2.0185546875, 2.19580078125, 2.373046875, 2.55029296875, 2.7275390625, 2.90478515625, 3.08203125, 3.25927734375, 3.4365234375, 3.61376953125, 3.791015625, 3.96826171875, 4.1455078125, 4.32275390625, 4.5, 4.67724609375, 4.8544921875, 5.03173828125, 5.208984375, 5.38623046875, 5.5634765625, 5.74072265625, 5.91796875]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 7.0, 10.0, 10.0, 16.0, 23.0, 35.0, 48.0, 51.0, 84.0, 170.0, 212.0, 327.0, 471.0, 684.0, 956.0, 1417.0, 2065.0, 2909.0, 4284.0, 6202.0, 8956.0, 13297.0, 19208.0, 28964.0, 44088.0, 71810.0, 129324.0, 261831.0, 187700.0, 95796.0, 56180.0, 35897.0, 24195.0, 16196.0, 10901.0, 7595.0, 5096.0, 3662.0, 2375.0, 1698.0, 1195.0, 778.0, 572.0, 403.0, 270.0, 183.0, 117.0, 93.0, 64.0, 34.0, 27.0, 25.0, 16.0, 11.0, 9.0, 8.0, 2.0, 5.0, 0.0, 3.0, 1.0], "bins": [-1.1650390625, -1.127166748046875, -1.08929443359375, -1.051422119140625, -1.0135498046875, -0.975677490234375, -0.93780517578125, -0.899932861328125, -0.862060546875, -0.824188232421875, -0.78631591796875, -0.748443603515625, -0.7105712890625, -0.672698974609375, -0.63482666015625, -0.596954345703125, -0.55908203125, -0.521209716796875, -0.48333740234375, -0.445465087890625, -0.4075927734375, -0.369720458984375, -0.33184814453125, -0.293975830078125, -0.256103515625, -0.218231201171875, -0.18035888671875, -0.142486572265625, -0.1046142578125, -0.066741943359375, -0.02886962890625, 0.009002685546875, 0.046875, 0.084747314453125, 0.12261962890625, 0.160491943359375, 0.1983642578125, 0.236236572265625, 0.27410888671875, 0.311981201171875, 0.349853515625, 0.387725830078125, 0.42559814453125, 0.463470458984375, 0.5013427734375, 0.539215087890625, 0.57708740234375, 0.614959716796875, 0.65283203125, 0.690704345703125, 0.72857666015625, 0.766448974609375, 0.8043212890625, 0.842193603515625, 0.88006591796875, 0.917938232421875, 0.955810546875, 0.993682861328125, 1.03155517578125, 1.069427490234375, 1.1072998046875, 1.145172119140625, 1.18304443359375, 1.220916748046875, 1.2587890625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 6.0, 7.0, 7.0, 6.0, 16.0, 10.0, 15.0, 17.0, 17.0, 25.0, 23.0, 24.0, 23.0, 35.0, 32.0, 29.0, 35.0, 32.0, 33.0, 47.0, 33.0, 1065.0, 43.0, 42.0, 39.0, 47.0, 42.0, 43.0, 30.0, 36.0, 25.0, 26.0, 20.0, 14.0, 15.0, 16.0, 15.0, 5.0, 7.0, 10.0, 3.0, 9.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.771484375, -3.632720947265625, -3.49395751953125, -3.355194091796875, -3.2164306640625, -3.077667236328125, -2.93890380859375, -2.800140380859375, -2.661376953125, -2.522613525390625, -2.38385009765625, -2.245086669921875, -2.1063232421875, -1.967559814453125, -1.82879638671875, -1.690032958984375, -1.55126953125, -1.412506103515625, -1.27374267578125, -1.134979248046875, -0.9962158203125, -0.857452392578125, -0.71868896484375, -0.579925537109375, -0.441162109375, -0.302398681640625, -0.16363525390625, -0.024871826171875, 0.1138916015625, 0.252655029296875, 0.39141845703125, 0.530181884765625, 0.6689453125, 0.807708740234375, 0.94647216796875, 1.085235595703125, 1.2239990234375, 1.362762451171875, 1.50152587890625, 1.640289306640625, 1.779052734375, 1.917816162109375, 2.05657958984375, 2.195343017578125, 2.3341064453125, 2.472869873046875, 2.61163330078125, 2.750396728515625, 2.88916015625, 3.027923583984375, 3.16668701171875, 3.305450439453125, 3.4442138671875, 3.582977294921875, 3.72174072265625, 3.860504150390625, 3.999267578125, 4.138031005859375, 4.27679443359375, 4.415557861328125, 4.5543212890625, 4.693084716796875, 4.83184814453125, 4.970611572265625, 5.109375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 10.0, 6.0, 7.0, 10.0, 11.0, 18.0, 25.0, 41.0, 60.0, 105.0, 212.0, 437.0, 799.0, 1574.0, 2972.0, 5667.0, 11221.0, 22517.0, 46081.0, 103744.0, 570577.0, 1134878.0, 103962.0, 46541.0, 22549.0, 11271.0, 5582.0, 2913.0, 1571.0, 791.0, 427.0, 217.0, 120.0, 67.0, 43.0, 25.0, 23.0, 22.0, 10.0, 7.0, 7.0, 7.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.49609375, -2.4286346435546875, -2.361175537109375, -2.2937164306640625, -2.22625732421875, -2.1587982177734375, -2.091339111328125, -2.0238800048828125, -1.9564208984375, -1.8889617919921875, -1.821502685546875, -1.7540435791015625, -1.68658447265625, -1.6191253662109375, -1.551666259765625, -1.4842071533203125, -1.416748046875, -1.3492889404296875, -1.281829833984375, -1.2143707275390625, -1.14691162109375, -1.0794525146484375, -1.011993408203125, -0.9445343017578125, -0.8770751953125, -0.8096160888671875, -0.742156982421875, -0.6746978759765625, -0.60723876953125, -0.5397796630859375, -0.472320556640625, -0.4048614501953125, -0.33740234375, -0.2699432373046875, -0.202484130859375, -0.1350250244140625, -0.06756591796875, -0.0001068115234375, 0.067352294921875, 0.1348114013671875, 0.2022705078125, 0.2697296142578125, 0.337188720703125, 0.4046478271484375, 0.47210693359375, 0.5395660400390625, 0.607025146484375, 0.6744842529296875, 0.741943359375, 0.8094024658203125, 0.876861572265625, 0.9443206787109375, 1.01177978515625, 1.0792388916015625, 1.146697998046875, 1.2141571044921875, 1.2816162109375, 1.3490753173828125, 1.416534423828125, 1.4839935302734375, 1.55145263671875, 1.6189117431640625, 1.686370849609375, 1.7538299560546875, 1.8212890625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 8.0, 4.0, 5.0, 8.0, 16.0, 12.0, 21.0, 29.0, 24.0, 29.0, 33.0, 36.0, 49.0, 52.0, 73.0, 74.0, 64.0, 54.0, 57.0, 60.0, 52.0, 49.0, 36.0, 28.0, 17.0, 22.0, 17.0, 10.0, 12.0, 10.0, 7.0, 12.0, 9.0, 4.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0], "bins": [-0.0012302398681640625, -0.0011997595429420471, -0.0011692792177200317, -0.0011387988924980164, -0.001108318567276001, -0.0010778382420539856, -0.0010473579168319702, -0.0010168775916099548, -0.0009863972663879395, -0.0009559169411659241, -0.0009254366159439087, -0.0008949562907218933, -0.0008644759654998779, -0.0008339956402778625, -0.0008035153150558472, -0.0007730349898338318, -0.0007425546646118164, -0.000712074339389801, -0.0006815940141677856, -0.0006511136889457703, -0.0006206333637237549, -0.0005901530385017395, -0.0005596727132797241, -0.0005291923880577087, -0.0004987120628356934, -0.000468231737613678, -0.0004377514123916626, -0.0004072710871696472, -0.00037679076194763184, -0.00034631043672561646, -0.0003158301115036011, -0.0002853497862815857, -0.0002548694610595703, -0.00022438913583755493, -0.00019390881061553955, -0.00016342848539352417, -0.0001329481601715088, -0.00010246783494949341, -7.198750972747803e-05, -4.1507184505462646e-05, -1.1026859283447266e-05, 1.9453465938568115e-05, 4.9933791160583496e-05, 8.041411638259888e-05, 0.00011089444160461426, 0.00014137476682662964, 0.00017185509204864502, 0.0002023354172706604, 0.00023281574249267578, 0.00026329606771469116, 0.00029377639293670654, 0.0003242567181587219, 0.0003547370433807373, 0.0003852173686027527, 0.00041569769382476807, 0.00044617801904678345, 0.00047665834426879883, 0.0005071386694908142, 0.0005376189947128296, 0.000568099319934845, 0.0005985796451568604, 0.0006290599703788757, 0.0006595402956008911, 0.0006900206208229065, 0.0007205009460449219]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 8.0, 3.0, 6.0, 10.0, 12.0, 13.0, 9.0, 14.0, 30.0, 27.0, 32.0, 61.0, 61.0, 89.0, 110.0, 243.0, 578.0, 2578.0, 1035616.0, 7640.0, 666.0, 258.0, 125.0, 80.0, 63.0, 62.0, 38.0, 31.0, 24.0, 23.0, 12.0, 7.0, 6.0, 5.0, 7.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01776123046875, -0.017039060592651367, -0.016316890716552734, -0.015594720840454102, -0.014872550964355469, -0.014150381088256836, -0.013428211212158203, -0.01270604133605957, -0.011983871459960938, -0.011261701583862305, -0.010539531707763672, -0.009817361831665039, -0.009095191955566406, -0.008373022079467773, -0.007650852203369141, -0.006928682327270508, -0.006206512451171875, -0.005484342575073242, -0.004762172698974609, -0.0040400028228759766, -0.0033178329467773438, -0.002595663070678711, -0.0018734931945800781, -0.0011513233184814453, -0.0004291534423828125, 0.0002930164337158203, 0.0010151863098144531, 0.001737356185913086, 0.0024595260620117188, 0.0031816959381103516, 0.0039038658142089844, 0.004626035690307617, 0.00534820556640625, 0.006070375442504883, 0.006792545318603516, 0.0075147151947021484, 0.008236885070800781, 0.008959054946899414, 0.009681224822998047, 0.01040339469909668, 0.011125564575195312, 0.011847734451293945, 0.012569904327392578, 0.013292074203491211, 0.014014244079589844, 0.014736413955688477, 0.01545858383178711, 0.016180753707885742, 0.016902923583984375, 0.017625093460083008, 0.01834726333618164, 0.019069433212280273, 0.019791603088378906, 0.02051377296447754, 0.021235942840576172, 0.021958112716674805, 0.022680282592773438, 0.02340245246887207, 0.024124622344970703, 0.024846792221069336, 0.02556896209716797, 0.0262911319732666, 0.027013301849365234, 0.027735471725463867, 0.0284576416015625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 10.0, 31.0, 96.0, 219.0, 292.0, 230.0, 91.0, 26.0, 8.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001026341924443841, -0.0009876744588837028, -0.0009490069933235645, -0.0009103394695557654, -0.0008716720039956272, -0.0008330045384354889, -0.0007943370146676898, -0.0007556695491075516, -0.0007170020835474133, -0.0006783346179872751, -0.0006396671524271369, -0.0006009996286593378, -0.0005623321630991995, -0.0005236646975390613, -0.0004849972028750926, -0.00044632970821112394, -0.0004076622426509857, -0.0003689947770908475, -0.0003303272824268788, -0.00029165978776291013, -0.0002529923222027719, -0.00021432484209071845, -0.000175657361978665, -0.0001369898673146963, -9.832240175455809e-05, -5.965492164250463e-05, -2.098744153045118e-05, 1.7680038581602275e-05, 5.634751869365573e-05, 9.501499880570918e-05, 0.00013368247891776264, 0.00017234997358173132, 0.00021101743914186954, 0.00024968490470200777, 0.00028835239936597645, 0.00032701989402994514, 0.00036568735959008336, 0.0004043548251502216, 0.00044302231981419027, 0.00048168981447815895, 0.0005203572800382972, 0.0005590247455984354, 0.0005976922111585736, 0.0006363597349263728, 0.000675027200486511, 0.0007136946660466492, 0.0007523621898144484, 0.0007910296553745866, 0.0008296971209347248, 0.000868364586494863, 0.0009070320520550013, 0.0009456995758228004, 0.0009843669831752777, 0.0010230345651507378, 0.001061702030710876, 0.0011003694962710142, 0.0011390369618311524, 0.0011777044273912907, 0.0012163718929514289, 0.0012550393585115671, 0.0012937069404870272, 0.0013323744060471654, 0.0013710418716073036, 0.0014097093371674418, 0.00144837680272758]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 4.0, 0.0, 3.0, 5.0, 9.0, 4.0, 8.0, 9.0, 9.0, 13.0, 18.0, 12.0, 14.0, 23.0, 23.0, 23.0, 24.0, 21.0, 35.0, 38.0, 30.0, 40.0, 35.0, 36.0, 44.0, 45.0, 34.0, 47.0, 54.0, 31.0, 23.0, 32.0, 29.0, 37.0, 30.0, 20.0, 28.0, 17.0, 7.0, 15.0, 10.0, 17.0, 13.0, 6.0, 5.0, 6.0, 7.0, 6.0, 2.0, 1.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00044977664947509766, -0.0004359520971775055, -0.00042212754487991333, -0.00040830299258232117, -0.000394478440284729, -0.00038065388798713684, -0.0003668293356895447, -0.0003530047833919525, -0.00033918023109436035, -0.0003253556787967682, -0.000311531126499176, -0.00029770657420158386, -0.0002838820219039917, -0.00027005746960639954, -0.0002562329173088074, -0.0002424083650112152, -0.00022858381271362305, -0.00021475926041603088, -0.00020093470811843872, -0.00018711015582084656, -0.0001732856035232544, -0.00015946105122566223, -0.00014563649892807007, -0.0001318119466304779, -0.00011798739433288574, -0.00010416284203529358, -9.033828973770142e-05, -7.651373744010925e-05, -6.268918514251709e-05, -4.886463284492493e-05, -3.5040080547332764e-05, -2.12155282497406e-05, -7.3909759521484375e-06, 6.433576345443726e-06, 2.025812864303589e-05, 3.408268094062805e-05, 4.7907233238220215e-05, 6.173178553581238e-05, 7.555633783340454e-05, 8.93808901309967e-05, 0.00010320544242858887, 0.00011702999472618103, 0.0001308545470237732, 0.00014467909932136536, 0.00015850365161895752, 0.00017232820391654968, 0.00018615275621414185, 0.000199977308511734, 0.00021380186080932617, 0.00022762641310691833, 0.0002414509654045105, 0.00025527551770210266, 0.0002691000699996948, 0.000282924622297287, 0.00029674917459487915, 0.0003105737268924713, 0.0003243982791900635, 0.00033822283148765564, 0.0003520473837852478, 0.00036587193608283997, 0.00037969648838043213, 0.0003935210406780243, 0.00040734559297561646, 0.0004211701452732086, 0.0004349946975708008]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 6.0, 3.0, 3.0, 1.0, 5.0, 10.0, 5.0, 8.0, 6.0, 16.0, 20.0, 16.0, 17.0, 16.0, 25.0, 15.0, 27.0, 27.0, 30.0, 28.0, 27.0, 30.0, 26.0, 39.0, 23.0, 29.0, 29.0, 27.0, 24.0, 32.0, 40.0, 30.0, 41.0, 27.0, 33.0, 22.0, 26.0, 27.0, 27.0, 15.0, 17.0, 21.0, 15.0, 16.0, 11.0, 13.0, 7.0, 12.0, 7.0, 6.0, 6.0, 2.0, 6.0, 5.0, 3.0, 4.0, 1.0, 4.0, 0.0, 3.0, 1.0], "bins": [-5.42578125, -5.24853515625, -5.0712890625, -4.89404296875, -4.716796875, -4.53955078125, -4.3623046875, -4.18505859375, -4.0078125, -3.83056640625, -3.6533203125, -3.47607421875, -3.298828125, -3.12158203125, -2.9443359375, -2.76708984375, -2.58984375, -2.41259765625, -2.2353515625, -2.05810546875, -1.880859375, -1.70361328125, -1.5263671875, -1.34912109375, -1.171875, -0.99462890625, -0.8173828125, -0.64013671875, -0.462890625, -0.28564453125, -0.1083984375, 0.06884765625, 0.24609375, 0.42333984375, 0.6005859375, 0.77783203125, 0.955078125, 1.13232421875, 1.3095703125, 1.48681640625, 1.6640625, 1.84130859375, 2.0185546875, 2.19580078125, 2.373046875, 2.55029296875, 2.7275390625, 2.90478515625, 3.08203125, 3.25927734375, 3.4365234375, 3.61376953125, 3.791015625, 3.96826171875, 4.1455078125, 4.32275390625, 4.5, 4.67724609375, 4.8544921875, 5.03173828125, 5.208984375, 5.38623046875, 5.5634765625, 5.74072265625, 5.91796875]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 0.0, 5.0, 3.0, 7.0, 13.0, 15.0, 10.0, 23.0, 17.0, 30.0, 33.0, 51.0, 83.0, 99.0, 172.0, 290.0, 463.0, 831.0, 1362.0, 2616.0, 4437.0, 8241.0, 15136.0, 28761.0, 57484.0, 125607.0, 275614.0, 277720.0, 127463.0, 58935.0, 28767.0, 15406.0, 8199.0, 4522.0, 2613.0, 1408.0, 815.0, 497.0, 263.0, 174.0, 93.0, 57.0, 53.0, 34.0, 32.0, 20.0, 13.0, 16.0, 10.0, 14.0, 8.0, 8.0, 5.0, 5.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0], "bins": [-4.640625, -4.490966796875, -4.34130859375, -4.191650390625, -4.0419921875, -3.892333984375, -3.74267578125, -3.593017578125, -3.443359375, -3.293701171875, -3.14404296875, -2.994384765625, -2.8447265625, -2.695068359375, -2.54541015625, -2.395751953125, -2.24609375, -2.096435546875, -1.94677734375, -1.797119140625, -1.6474609375, -1.497802734375, -1.34814453125, -1.198486328125, -1.048828125, -0.899169921875, -0.74951171875, -0.599853515625, -0.4501953125, -0.300537109375, -0.15087890625, -0.001220703125, 0.1484375, 0.298095703125, 0.44775390625, 0.597412109375, 0.7470703125, 0.896728515625, 1.04638671875, 1.196044921875, 1.345703125, 1.495361328125, 1.64501953125, 1.794677734375, 1.9443359375, 2.093994140625, 2.24365234375, 2.393310546875, 2.54296875, 2.692626953125, 2.84228515625, 2.991943359375, 3.1416015625, 3.291259765625, 3.44091796875, 3.590576171875, 3.740234375, 3.889892578125, 4.03955078125, 4.189208984375, 4.3388671875, 4.488525390625, 4.63818359375, 4.787841796875, 4.9375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 1.0, 6.0, 3.0, 13.0, 4.0, 17.0, 10.0, 14.0, 24.0, 24.0, 26.0, 40.0, 49.0, 44.0, 63.0, 57.0, 84.0, 205.0, 1638.0, 230.0, 105.0, 60.0, 46.0, 43.0, 30.0, 32.0, 30.0, 20.0, 27.0, 21.0, 14.0, 18.0, 14.0, 7.0, 9.0, 3.0, 3.0, 3.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.5625, -24.776611328125, -23.99072265625, -23.204833984375, -22.4189453125, -21.633056640625, -20.84716796875, -20.061279296875, -19.275390625, -18.489501953125, -17.70361328125, -16.917724609375, -16.1318359375, -15.345947265625, -14.56005859375, -13.774169921875, -12.98828125, -12.202392578125, -11.41650390625, -10.630615234375, -9.8447265625, -9.058837890625, -8.27294921875, -7.487060546875, -6.701171875, -5.915283203125, -5.12939453125, -4.343505859375, -3.5576171875, -2.771728515625, -1.98583984375, -1.199951171875, -0.4140625, 0.371826171875, 1.15771484375, 1.943603515625, 2.7294921875, 3.515380859375, 4.30126953125, 5.087158203125, 5.873046875, 6.658935546875, 7.44482421875, 8.230712890625, 9.0166015625, 9.802490234375, 10.58837890625, 11.374267578125, 12.16015625, 12.946044921875, 13.73193359375, 14.517822265625, 15.3037109375, 16.089599609375, 16.87548828125, 17.661376953125, 18.447265625, 19.233154296875, 20.01904296875, 20.804931640625, 21.5908203125, 22.376708984375, 23.16259765625, 23.948486328125, 24.734375]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 7.0, 1.0, 5.0, 8.0, 13.0, 16.0, 18.0, 16.0, 13.0, 33.0, 43.0, 44.0, 70.0, 95.0, 109.0, 157.0, 192.0, 347.0, 688.0, 4150.0, 514004.0, 2615017.0, 8342.0, 982.0, 430.0, 257.0, 149.0, 125.0, 83.0, 56.0, 55.0, 38.0, 42.0, 21.0, 15.0, 16.0, 10.0, 9.0, 7.0, 4.0, 2.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.15625, -36.9296875, -35.703125, -34.4765625, -33.25, -32.0234375, -30.796875, -29.5703125, -28.34375, -27.1171875, -25.890625, -24.6640625, -23.4375, -22.2109375, -20.984375, -19.7578125, -18.53125, -17.3046875, -16.078125, -14.8515625, -13.625, -12.3984375, -11.171875, -9.9453125, -8.71875, -7.4921875, -6.265625, -5.0390625, -3.8125, -2.5859375, -1.359375, -0.1328125, 1.09375, 2.3203125, 3.546875, 4.7734375, 6.0, 7.2265625, 8.453125, 9.6796875, 10.90625, 12.1328125, 13.359375, 14.5859375, 15.8125, 17.0390625, 18.265625, 19.4921875, 20.71875, 21.9453125, 23.171875, 24.3984375, 25.625, 26.8515625, 28.078125, 29.3046875, 30.53125, 31.7578125, 32.984375, 34.2109375, 35.4375, 36.6640625, 37.890625, 39.1171875, 40.34375]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 254.0, 677.0, 80.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.110538482666016, -54.985137939453125, -50.8597412109375, -46.73434066772461, -42.60894012451172, -38.483543395996094, -34.3581428527832, -30.232744216918945, -26.107345581054688, -21.98194694519043, -17.856548309326172, -13.731147766113281, -9.605749130249023, -5.480350494384766, -1.354949951171875, 2.770448684692383, 6.895847320556641, 11.021245956420898, 15.146645545959473, 19.272045135498047, 23.397443771362305, 27.522842407226562, 31.648242950439453, 35.773643493652344, 39.89904022216797, 44.02444076538086, 48.149837493896484, 52.275238037109375, 56.400634765625, 60.52603530883789, 64.65143585205078, 68.7768325805664, 72.90223693847656, 77.02763366699219, 81.15303802490234, 85.27843475341797, 89.4038314819336, 93.52923583984375, 97.65463256835938, 101.780029296875, 105.90542602539062, 110.03082275390625, 114.1562271118164, 118.28162384033203, 122.40702056884766, 126.53242492675781, 130.65782165527344, 134.78321838378906, 138.90863037109375, 143.03402709960938, 147.159423828125, 151.28482055664062, 155.4102325439453, 159.53562927246094, 163.66102600097656, 167.7864227294922, 171.9118194580078, 176.03721618652344, 180.16261291503906, 184.28802490234375, 188.41342163085938, 192.538818359375, 196.66421508789062, 200.78961181640625, 204.91500854492188]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 2.0, 4.0, 6.0, 7.0, 8.0, 9.0, 10.0, 11.0, 14.0, 21.0, 26.0, 17.0, 19.0, 27.0, 26.0, 32.0, 31.0, 32.0, 38.0, 33.0, 41.0, 32.0, 49.0, 35.0, 43.0, 39.0, 46.0, 32.0, 25.0, 28.0, 26.0, 35.0, 27.0, 36.0, 28.0, 12.0, 24.0, 11.0, 10.0, 10.0, 8.0, 4.0, 7.0, 7.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 3.0], "bins": [-53.394432067871094, -51.69292068481445, -49.99140548706055, -48.289894104003906, -46.588382720947266, -44.886871337890625, -43.18535614013672, -41.48384475708008, -39.78233337402344, -38.0808219909668, -36.37930679321289, -34.67779541015625, -32.97628402709961, -31.274770736694336, -29.573257446289062, -27.871746063232422, -26.170230865478516, -24.468717575073242, -22.7672061920166, -21.065692901611328, -19.364181518554688, -17.662668228149414, -15.96115493774414, -14.259642601013184, -12.558130264282227, -10.85661792755127, -9.155105590820312, -7.453592300415039, -5.752079963684082, -4.050567626953125, -2.3490543365478516, -0.6475419998168945, 1.0539665222167969, 2.755479097366333, 4.456991672515869, 6.158504486083984, 7.860016822814941, 9.561529159545898, 11.263042449951172, 12.964554786682129, 14.666067123413086, 16.36758041381836, 18.069091796875, 19.770605087280273, 21.472118377685547, 23.173629760742188, 24.87514305114746, 26.576656341552734, 28.278167724609375, 29.97968101501465, 31.68119239807129, 33.38270568847656, 35.0842170715332, 36.785728454589844, 38.48724365234375, 40.18875503540039, 41.89026641845703, 43.59177780151367, 45.29329299926758, 46.99480438232422, 48.69631576538086, 50.3978271484375, 52.099342346191406, 53.80085372924805, 55.50236892700195]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 1.0, 2.0, 5.0, 5.0, 3.0, 3.0, 6.0, 9.0, 7.0, 11.0, 19.0, 12.0, 17.0, 14.0, 26.0, 25.0, 22.0, 10.0, 31.0, 39.0, 29.0, 37.0, 35.0, 21.0, 31.0, 17.0, 21.0, 34.0, 37.0, 32.0, 38.0, 33.0, 43.0, 32.0, 32.0, 31.0, 19.0, 31.0, 14.0, 26.0, 20.0, 16.0, 13.0, 19.0, 13.0, 17.0, 4.0, 9.0, 11.0, 2.0, 6.0, 1.0, 3.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-5.828125, -5.63934326171875, -5.4505615234375, -5.26177978515625, -5.072998046875, -4.88421630859375, -4.6954345703125, -4.50665283203125, -4.31787109375, -4.12908935546875, -3.9403076171875, -3.75152587890625, -3.562744140625, -3.37396240234375, -3.1851806640625, -2.99639892578125, -2.8076171875, -2.61883544921875, -2.4300537109375, -2.24127197265625, -2.052490234375, -1.86370849609375, -1.6749267578125, -1.48614501953125, -1.29736328125, -1.10858154296875, -0.9197998046875, -0.73101806640625, -0.542236328125, -0.35345458984375, -0.1646728515625, 0.02410888671875, 0.212890625, 0.40167236328125, 0.5904541015625, 0.77923583984375, 0.968017578125, 1.15679931640625, 1.3455810546875, 1.53436279296875, 1.72314453125, 1.91192626953125, 2.1007080078125, 2.28948974609375, 2.478271484375, 2.66705322265625, 2.8558349609375, 3.04461669921875, 3.2333984375, 3.42218017578125, 3.6109619140625, 3.79974365234375, 3.988525390625, 4.17730712890625, 4.3660888671875, 4.55487060546875, 4.74365234375, 4.93243408203125, 5.1212158203125, 5.30999755859375, 5.498779296875, 5.68756103515625, 5.8763427734375, 6.06512451171875, 6.25390625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 7.0, 8.0, 4.0, 11.0, 6.0, 10.0, 20.0, 17.0, 28.0, 27.0, 38.0, 41.0, 51.0, 59.0, 77.0, 88.0, 145.0, 353.0, 1463.0, 12450.0, 494253.0, 3466239.0, 209634.0, 7316.0, 1023.0, 302.0, 148.0, 95.0, 67.0, 58.0, 42.0, 40.0, 34.0, 17.0, 17.0, 11.0, 14.0, 17.0, 11.0, 8.0, 13.0, 6.0, 11.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-22.25, -21.466552734375, -20.68310546875, -19.899658203125, -19.1162109375, -18.332763671875, -17.54931640625, -16.765869140625, -15.982421875, -15.198974609375, -14.41552734375, -13.632080078125, -12.8486328125, -12.065185546875, -11.28173828125, -10.498291015625, -9.71484375, -8.931396484375, -8.14794921875, -7.364501953125, -6.5810546875, -5.797607421875, -5.01416015625, -4.230712890625, -3.447265625, -2.663818359375, -1.88037109375, -1.096923828125, -0.3134765625, 0.469970703125, 1.25341796875, 2.036865234375, 2.8203125, 3.603759765625, 4.38720703125, 5.170654296875, 5.9541015625, 6.737548828125, 7.52099609375, 8.304443359375, 9.087890625, 9.871337890625, 10.65478515625, 11.438232421875, 12.2216796875, 13.005126953125, 13.78857421875, 14.572021484375, 15.35546875, 16.138916015625, 16.92236328125, 17.705810546875, 18.4892578125, 19.272705078125, 20.05615234375, 20.839599609375, 21.623046875, 22.406494140625, 23.18994140625, 23.973388671875, 24.7568359375, 25.540283203125, 26.32373046875, 27.107177734375, 27.890625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 4.0, 6.0, 8.0, 11.0, 15.0, 25.0, 31.0, 33.0, 53.0, 77.0, 98.0, 135.0, 188.0, 292.0, 400.0, 468.0, 534.0, 462.0, 381.0, 244.0, 180.0, 124.0, 82.0, 69.0, 48.0, 41.0, 23.0, 17.0, 10.0, 6.0, 4.0, 4.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.359375, -10.927978515625, -10.49658203125, -10.065185546875, -9.6337890625, -9.202392578125, -8.77099609375, -8.339599609375, -7.908203125, -7.476806640625, -7.04541015625, -6.614013671875, -6.1826171875, -5.751220703125, -5.31982421875, -4.888427734375, -4.45703125, -4.025634765625, -3.59423828125, -3.162841796875, -2.7314453125, -2.300048828125, -1.86865234375, -1.437255859375, -1.005859375, -0.574462890625, -0.14306640625, 0.288330078125, 0.7197265625, 1.151123046875, 1.58251953125, 2.013916015625, 2.4453125, 2.876708984375, 3.30810546875, 3.739501953125, 4.1708984375, 4.602294921875, 5.03369140625, 5.465087890625, 5.896484375, 6.327880859375, 6.75927734375, 7.190673828125, 7.6220703125, 8.053466796875, 8.48486328125, 8.916259765625, 9.34765625, 9.779052734375, 10.21044921875, 10.641845703125, 11.0732421875, 11.504638671875, 11.93603515625, 12.367431640625, 12.798828125, 13.230224609375, 13.66162109375, 14.093017578125, 14.5244140625, 14.955810546875, 15.38720703125, 15.818603515625, 16.25]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 10.0, 7.0, 12.0, 11.0, 14.0, 25.0, 36.0, 41.0, 73.0, 64.0, 87.0, 130.0, 160.0, 247.0, 358.0, 734.0, 3898.0, 679255.0, 3497461.0, 9211.0, 994.0, 399.0, 233.0, 173.0, 143.0, 110.0, 87.0, 68.0, 49.0, 48.0, 39.0, 26.0, 21.0, 10.0, 14.0, 8.0, 8.0, 5.0, 7.0, 4.0, 4.0, 4.0], "bins": [-77.125, -75.203125, -73.28125, -71.359375, -69.4375, -67.515625, -65.59375, -63.671875, -61.75, -59.828125, -57.90625, -55.984375, -54.0625, -52.140625, -50.21875, -48.296875, -46.375, -44.453125, -42.53125, -40.609375, -38.6875, -36.765625, -34.84375, -32.921875, -31.0, -29.078125, -27.15625, -25.234375, -23.3125, -21.390625, -19.46875, -17.546875, -15.625, -13.703125, -11.78125, -9.859375, -7.9375, -6.015625, -4.09375, -2.171875, -0.25, 1.671875, 3.59375, 5.515625, 7.4375, 9.359375, 11.28125, 13.203125, 15.125, 17.046875, 18.96875, 20.890625, 22.8125, 24.734375, 26.65625, 28.578125, 30.5, 32.421875, 34.34375, 36.265625, 38.1875, 40.109375, 42.03125, 43.953125, 45.875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 72.0, 500.0, 395.0, 44.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.8634490966797, -136.6352081298828, -129.40696716308594, -122.1787338256836, -114.95049285888672, -107.72225189208984, -100.4940185546875, -93.26577758789062, -86.03753662109375, -78.80929565429688, -71.5810546875, -64.35282135009766, -57.12458038330078, -49.896339416503906, -42.6681022644043, -35.43986511230469, -28.211624145507812, -20.98338508605957, -13.755146026611328, -6.526906967163086, 0.7013320922851562, 7.929573059082031, 15.15781021118164, 22.38604736328125, 29.614288330078125, 36.842529296875, 44.07076644897461, 51.29900360107422, 58.527244567871094, 65.75548553466797, 72.98371887207031, 80.21195983886719, 87.44021606445312, 94.66845703125, 101.89669799804688, 109.12493133544922, 116.3531723022461, 123.58141326904297, 130.8096466064453, 138.0378875732422, 145.26612854003906, 152.49436950683594, 159.7226104736328, 166.9508514404297, 174.1790771484375, 181.40731811523438, 188.63555908203125, 195.86380004882812, 203.092041015625, 210.32028198242188, 217.54852294921875, 224.77676391601562, 232.0050048828125, 239.23324584960938, 246.4614715576172, 253.68971252441406, 260.91796875, 268.1462097167969, 275.37445068359375, 282.6026916503906, 289.8309326171875, 297.0591735839844, 304.28741455078125, 311.515625, 318.7438659667969]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 2.0, 4.0, 2.0, 6.0, 6.0, 8.0, 11.0, 7.0, 10.0, 10.0, 12.0, 9.0, 24.0, 15.0, 23.0, 32.0, 21.0, 33.0, 25.0, 40.0, 38.0, 35.0, 48.0, 35.0, 29.0, 46.0, 31.0, 38.0, 42.0, 39.0, 35.0, 33.0, 31.0, 28.0, 26.0, 23.0, 23.0, 20.0, 13.0, 9.0, 15.0, 13.0, 11.0, 3.0, 9.0, 7.0, 7.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-33.45185852050781, -32.26116180419922, -31.070465087890625, -29.87976837158203, -28.689071655273438, -27.498374938964844, -26.307676315307617, -25.116979598999023, -23.92628288269043, -22.735586166381836, -21.544889450073242, -20.35419273376465, -19.163494110107422, -17.972797393798828, -16.782100677490234, -15.59140396118164, -14.400707244873047, -13.210010528564453, -12.01931381225586, -10.82861614227295, -9.637919425964355, -8.447222709655762, -7.25652551651001, -6.065828323364258, -4.875131607055664, -3.684434652328491, -2.4937376976013184, -1.3030407428741455, -0.11234378814697266, 1.078352928161621, 2.269050121307373, 3.459747314453125, 4.650444030761719, 5.8411407470703125, 7.0318379402160645, 8.222535133361816, 9.41323184967041, 10.603928565979004, 11.794626235961914, 12.985322952270508, 14.176019668579102, 15.366716384887695, 16.55741310119629, 17.748109817504883, 18.93880844116211, 20.129505157470703, 21.320201873779297, 22.51089859008789, 23.701595306396484, 24.892292022705078, 26.082988739013672, 27.273685455322266, 28.46438217163086, 29.655078887939453, 30.84577751159668, 32.036476135253906, 33.2271728515625, 34.417869567871094, 35.60856628417969, 36.79926300048828, 37.989959716796875, 39.18065643310547, 40.37135314941406, 41.562049865722656, 42.75274658203125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 8.0, 7.0, 9.0, 11.0, 14.0, 19.0, 26.0, 25.0, 20.0, 27.0, 21.0, 30.0, 24.0, 41.0, 38.0, 27.0, 25.0, 48.0, 36.0, 43.0, 37.0, 37.0, 33.0, 35.0, 39.0, 34.0, 23.0, 46.0, 40.0, 18.0, 10.0, 32.0, 17.0, 22.0, 8.0, 11.0, 13.0, 10.0, 9.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.76953125, -6.5496826171875, -6.329833984375, -6.1099853515625, -5.89013671875, -5.6702880859375, -5.450439453125, -5.2305908203125, -5.0107421875, -4.7908935546875, -4.571044921875, -4.3511962890625, -4.13134765625, -3.9114990234375, -3.691650390625, -3.4718017578125, -3.251953125, -3.0321044921875, -2.812255859375, -2.5924072265625, -2.37255859375, -2.1527099609375, -1.932861328125, -1.7130126953125, -1.4931640625, -1.2733154296875, -1.053466796875, -0.8336181640625, -0.61376953125, -0.3939208984375, -0.174072265625, 0.0457763671875, 0.265625, 0.4854736328125, 0.705322265625, 0.9251708984375, 1.14501953125, 1.3648681640625, 1.584716796875, 1.8045654296875, 2.0244140625, 2.2442626953125, 2.464111328125, 2.6839599609375, 2.90380859375, 3.1236572265625, 3.343505859375, 3.5633544921875, 3.783203125, 4.0030517578125, 4.222900390625, 4.4427490234375, 4.66259765625, 4.8824462890625, 5.102294921875, 5.3221435546875, 5.5419921875, 5.7618408203125, 5.981689453125, 6.2015380859375, 6.42138671875, 6.6412353515625, 6.861083984375, 7.0809326171875, 7.30078125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 3.0, 5.0, 12.0, 13.0, 18.0, 33.0, 44.0, 62.0, 91.0, 147.0, 215.0, 307.0, 436.0, 672.0, 979.0, 1387.0, 2052.0, 3094.0, 4474.0, 6664.0, 9521.0, 14174.0, 20530.0, 29955.0, 44731.0, 67757.0, 113187.0, 258310.0, 192862.0, 94205.0, 59260.0, 39550.0, 26324.0, 18162.0, 12390.0, 8544.0, 5934.0, 3936.0, 2743.0, 1845.0, 1280.0, 862.0, 570.0, 396.0, 249.0, 199.0, 123.0, 89.0, 57.0, 35.0, 23.0, 21.0, 12.0, 10.0, 8.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.1943359375, -1.155609130859375, -1.11688232421875, -1.078155517578125, -1.0394287109375, -1.000701904296875, -0.96197509765625, -0.923248291015625, -0.884521484375, -0.845794677734375, -0.80706787109375, -0.768341064453125, -0.7296142578125, -0.690887451171875, -0.65216064453125, -0.613433837890625, -0.57470703125, -0.535980224609375, -0.49725341796875, -0.458526611328125, -0.4197998046875, -0.381072998046875, -0.34234619140625, -0.303619384765625, -0.264892578125, -0.226165771484375, -0.18743896484375, -0.148712158203125, -0.1099853515625, -0.071258544921875, -0.03253173828125, 0.006195068359375, 0.044921875, 0.083648681640625, 0.12237548828125, 0.161102294921875, 0.1998291015625, 0.238555908203125, 0.27728271484375, 0.316009521484375, 0.354736328125, 0.393463134765625, 0.43218994140625, 0.470916748046875, 0.5096435546875, 0.548370361328125, 0.58709716796875, 0.625823974609375, 0.66455078125, 0.703277587890625, 0.74200439453125, 0.780731201171875, 0.8194580078125, 0.858184814453125, 0.89691162109375, 0.935638427734375, 0.974365234375, 1.013092041015625, 1.05181884765625, 1.090545654296875, 1.1292724609375, 1.167999267578125, 1.20672607421875, 1.245452880859375, 1.2841796875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 0.0, 3.0, 3.0, 11.0, 5.0, 8.0, 15.0, 10.0, 15.0, 14.0, 18.0, 24.0, 28.0, 15.0, 24.0, 36.0, 26.0, 31.0, 36.0, 33.0, 40.0, 28.0, 42.0, 1071.0, 41.0, 39.0, 41.0, 45.0, 35.0, 23.0, 34.0, 34.0, 26.0, 30.0, 21.0, 18.0, 10.0, 17.0, 18.0, 17.0, 10.0, 12.0, 6.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.80859375, -4.661865234375, -4.51513671875, -4.368408203125, -4.2216796875, -4.074951171875, -3.92822265625, -3.781494140625, -3.634765625, -3.488037109375, -3.34130859375, -3.194580078125, -3.0478515625, -2.901123046875, -2.75439453125, -2.607666015625, -2.4609375, -2.314208984375, -2.16748046875, -2.020751953125, -1.8740234375, -1.727294921875, -1.58056640625, -1.433837890625, -1.287109375, -1.140380859375, -0.99365234375, -0.846923828125, -0.7001953125, -0.553466796875, -0.40673828125, -0.260009765625, -0.11328125, 0.033447265625, 0.18017578125, 0.326904296875, 0.4736328125, 0.620361328125, 0.76708984375, 0.913818359375, 1.060546875, 1.207275390625, 1.35400390625, 1.500732421875, 1.6474609375, 1.794189453125, 1.94091796875, 2.087646484375, 2.234375, 2.381103515625, 2.52783203125, 2.674560546875, 2.8212890625, 2.968017578125, 3.11474609375, 3.261474609375, 3.408203125, 3.554931640625, 3.70166015625, 3.848388671875, 3.9951171875, 4.141845703125, 4.28857421875, 4.435302734375, 4.58203125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 4.0, 4.0, 6.0, 7.0, 11.0, 19.0, 21.0, 28.0, 46.0, 68.0, 126.0, 231.0, 442.0, 840.0, 1663.0, 2957.0, 5779.0, 11010.0, 21760.0, 42273.0, 89098.0, 248112.0, 1443678.0, 119050.0, 53775.0, 27047.0, 13950.0, 7075.0, 3756.0, 2014.0, 1033.0, 555.0, 267.0, 171.0, 89.0, 53.0, 36.0, 17.0, 13.0, 16.0, 10.0, 9.0, 8.0, 2.0, 1.0, 1.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.236328125, -2.164581298828125, -2.09283447265625, -2.021087646484375, -1.9493408203125, -1.877593994140625, -1.80584716796875, -1.734100341796875, -1.662353515625, -1.590606689453125, -1.51885986328125, -1.447113037109375, -1.3753662109375, -1.303619384765625, -1.23187255859375, -1.160125732421875, -1.08837890625, -1.016632080078125, -0.94488525390625, -0.873138427734375, -0.8013916015625, -0.729644775390625, -0.65789794921875, -0.586151123046875, -0.514404296875, -0.442657470703125, -0.37091064453125, -0.299163818359375, -0.2274169921875, -0.155670166015625, -0.08392333984375, -0.012176513671875, 0.0595703125, 0.131317138671875, 0.20306396484375, 0.274810791015625, 0.3465576171875, 0.418304443359375, 0.49005126953125, 0.561798095703125, 0.633544921875, 0.705291748046875, 0.77703857421875, 0.848785400390625, 0.9205322265625, 0.992279052734375, 1.06402587890625, 1.135772705078125, 1.20751953125, 1.279266357421875, 1.35101318359375, 1.422760009765625, 1.4945068359375, 1.566253662109375, 1.63800048828125, 1.709747314453125, 1.781494140625, 1.853240966796875, 1.92498779296875, 1.996734619140625, 2.0684814453125, 2.140228271484375, 2.21197509765625, 2.283721923828125, 2.35546875]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 6.0, 4.0, 8.0, 5.0, 4.0, 7.0, 9.0, 19.0, 16.0, 26.0, 30.0, 38.0, 46.0, 52.0, 65.0, 51.0, 73.0, 77.0, 76.0, 65.0, 53.0, 48.0, 43.0, 38.0, 30.0, 17.0, 10.0, 19.0, 10.0, 12.0, 10.0, 8.0, 7.0, 4.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0007491111755371094, -0.000723712146282196, -0.0006983131170272827, -0.0006729140877723694, -0.0006475150585174561, -0.0006221160292625427, -0.0005967170000076294, -0.0005713179707527161, -0.0005459189414978027, -0.0005205199122428894, -0.0004951208829879761, -0.00046972185373306274, -0.0004443228244781494, -0.0004189237952232361, -0.00039352476596832275, -0.0003681257367134094, -0.0003427267074584961, -0.00031732767820358276, -0.00029192864894866943, -0.0002665296196937561, -0.00024113059043884277, -0.00021573156118392944, -0.0001903325319290161, -0.00016493350267410278, -0.00013953447341918945, -0.00011413544416427612, -8.873641490936279e-05, -6.333738565444946e-05, -3.793835639953613e-05, -1.2539327144622803e-05, 1.2859702110290527e-05, 3.825873136520386e-05, 6.365776062011719e-05, 8.905678987503052e-05, 0.00011445581912994385, 0.00013985484838485718, 0.0001652538776397705, 0.00019065290689468384, 0.00021605193614959717, 0.0002414509654045105, 0.00026684999465942383, 0.00029224902391433716, 0.0003176480531692505, 0.0003430470824241638, 0.00036844611167907715, 0.0003938451409339905, 0.0004192441701889038, 0.00044464319944381714, 0.00047004222869873047, 0.0004954412579536438, 0.0005208402872085571, 0.0005462393164634705, 0.0005716383457183838, 0.0005970373749732971, 0.0006224364042282104, 0.0006478354334831238, 0.0006732344627380371, 0.0006986334919929504, 0.0007240325212478638, 0.0007494315505027771, 0.0007748305797576904, 0.0008002296090126038, 0.0008256286382675171, 0.0008510276675224304, 0.0008764266967773438]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 4.0, 7.0, 6.0, 11.0, 10.0, 14.0, 24.0, 23.0, 47.0, 53.0, 99.0, 99.0, 188.0, 465.0, 5139.0, 1037922.0, 3461.0, 419.0, 182.0, 108.0, 74.0, 56.0, 42.0, 29.0, 15.0, 10.0, 10.0, 6.0, 10.0, 4.0, 6.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0266265869140625, -0.025896310806274414, -0.025166034698486328, -0.024435758590698242, -0.023705482482910156, -0.02297520637512207, -0.022244930267333984, -0.0215146541595459, -0.020784378051757812, -0.020054101943969727, -0.01932382583618164, -0.018593549728393555, -0.01786327362060547, -0.017132997512817383, -0.016402721405029297, -0.01567244529724121, -0.014942169189453125, -0.014211893081665039, -0.013481616973876953, -0.012751340866088867, -0.012021064758300781, -0.011290788650512695, -0.01056051254272461, -0.009830236434936523, -0.009099960327148438, -0.008369684219360352, -0.007639408111572266, -0.00690913200378418, -0.006178855895996094, -0.005448579788208008, -0.004718303680419922, -0.003988027572631836, -0.00325775146484375, -0.002527475357055664, -0.0017971992492675781, -0.0010669231414794922, -0.00033664703369140625, 0.0003936290740966797, 0.0011239051818847656, 0.0018541812896728516, 0.0025844573974609375, 0.0033147335052490234, 0.004045009613037109, 0.004775285720825195, 0.005505561828613281, 0.006235837936401367, 0.006966114044189453, 0.007696390151977539, 0.008426666259765625, 0.009156942367553711, 0.009887218475341797, 0.010617494583129883, 0.011347770690917969, 0.012078046798706055, 0.01280832290649414, 0.013538599014282227, 0.014268875122070312, 0.014999151229858398, 0.015729427337646484, 0.01645970344543457, 0.017189979553222656, 0.017920255661010742, 0.018650531768798828, 0.019380807876586914, 0.020111083984375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 6.0, 30.0, 55.0, 177.0, 254.0, 250.0, 154.0, 69.0, 16.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000304760062135756, -0.00026627344777807593, -0.00022778681886848062, -0.0001893001899588853, -0.00015081357560120523, -0.00011232696124352515, -7.384033233392984e-05, -3.5353703424334526e-05, 3.1329109333455563e-06, 4.161953256698325e-05, 8.010615420062095e-05, 0.00011859277583425865, 0.00015707939746789634, 0.00019556601182557642, 0.00023405264073517174, 0.00027253926964476705, 0.00031102588400244713, 0.0003495124983601272, 0.0003879991127178073, 0.00042648575617931783, 0.0004649723705369979, 0.0005034590139985085, 0.0005419456283561885, 0.0005804322427138686, 0.0006189188570715487, 0.0006574054714292288, 0.0006958920857869089, 0.000734378700144589, 0.0007728653727099299, 0.0008113519288599491, 0.0008498386014252901, 0.0008883252157829702, 0.0009268117137253284, 0.0009652983280830085, 0.0010037849424406886, 0.0010422716150060296, 0.0010807581711560488, 0.0011192448437213898, 0.001157731399871409, 0.00119621807243675, 0.001234704628586769, 0.00127319130115211, 0.0013116778573021293, 0.0013501645298674703, 0.0013886510860174894, 0.0014271377585828304, 0.0014656243147328496, 0.0015041109872981906, 0.0015425976598635316, 0.0015810843324288726, 0.0016195708885788918, 0.0016580575611442327, 0.001696544117294252, 0.001735030789859593, 0.001773517346009612, 0.001812004018574953, 0.001850490691140294, 0.001888977363705635, 0.0019274639198556542, 0.0019659504760056734, 0.0020044371485710144, 0.0020429238211363554, 0.0020814104937016964, 0.0021198969334363937, 0.0021583836060017347]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 7.0, 2.0, 9.0, 13.0, 19.0, 18.0, 13.0, 25.0, 25.0, 19.0, 29.0, 26.0, 41.0, 43.0, 34.0, 39.0, 37.0, 35.0, 39.0, 46.0, 49.0, 35.0, 50.0, 41.0, 38.0, 26.0, 35.0, 32.0, 27.0, 20.0, 24.0, 28.0, 16.0, 13.0, 10.0, 7.0, 4.0, 6.0, 7.0, 3.0, 4.0, 8.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004375576972961426, -0.0004243878647685051, -0.0004112180322408676, -0.00039804819971323013, -0.00038487836718559265, -0.00037170853465795517, -0.0003585387021303177, -0.0003453688696026802, -0.0003321990370750427, -0.00031902920454740524, -0.00030585937201976776, -0.0002926895394921303, -0.0002795197069644928, -0.0002663498744368553, -0.00025318004190921783, -0.00024001020938158035, -0.00022684037685394287, -0.0002136705443263054, -0.0002005007117986679, -0.00018733087927103043, -0.00017416104674339294, -0.00016099121421575546, -0.00014782138168811798, -0.0001346515491604805, -0.00012148171663284302, -0.00010831188410520554, -9.514205157756805e-05, -8.197221904993057e-05, -6.880238652229309e-05, -5.563255399465561e-05, -4.246272146701813e-05, -2.9292888939380646e-05, -1.6123056411743164e-05, -2.9532238841056824e-06, 1.02166086435318e-05, 2.338644117116928e-05, 3.655627369880676e-05, 4.9726106226444244e-05, 6.289593875408173e-05, 7.606577128171921e-05, 8.923560380935669e-05, 0.00010240543633699417, 0.00011557526886463165, 0.00012874510139226913, 0.00014191493391990662, 0.0001550847664475441, 0.00016825459897518158, 0.00018142443150281906, 0.00019459426403045654, 0.00020776409655809402, 0.0002209339290857315, 0.000234103761613369, 0.00024727359414100647, 0.00026044342666864395, 0.00027361325919628143, 0.0002867830917239189, 0.0002999529242515564, 0.0003131227567791939, 0.00032629258930683136, 0.00033946242183446884, 0.0003526322543621063, 0.0003658020868897438, 0.0003789719194173813, 0.00039214175194501877, 0.00040531158447265625]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 8.0, 7.0, 9.0, 11.0, 14.0, 19.0, 26.0, 25.0, 20.0, 27.0, 21.0, 30.0, 24.0, 41.0, 38.0, 27.0, 25.0, 48.0, 36.0, 43.0, 37.0, 37.0, 33.0, 35.0, 39.0, 34.0, 23.0, 46.0, 40.0, 18.0, 10.0, 32.0, 17.0, 22.0, 8.0, 11.0, 13.0, 10.0, 9.0, 8.0, 7.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.76953125, -6.5496826171875, -6.329833984375, -6.1099853515625, -5.89013671875, -5.6702880859375, -5.450439453125, -5.2305908203125, -5.0107421875, -4.7908935546875, -4.571044921875, -4.3511962890625, -4.13134765625, -3.9114990234375, -3.691650390625, -3.4718017578125, -3.251953125, -3.0321044921875, -2.812255859375, -2.5924072265625, -2.37255859375, -2.1527099609375, -1.932861328125, -1.7130126953125, -1.4931640625, -1.2733154296875, -1.053466796875, -0.8336181640625, -0.61376953125, -0.3939208984375, -0.174072265625, 0.0457763671875, 0.265625, 0.4854736328125, 0.705322265625, 0.9251708984375, 1.14501953125, 1.3648681640625, 1.584716796875, 1.8045654296875, 2.0244140625, 2.2442626953125, 2.464111328125, 2.6839599609375, 2.90380859375, 3.1236572265625, 3.343505859375, 3.5633544921875, 3.783203125, 4.0030517578125, 4.222900390625, 4.4427490234375, 4.66259765625, 4.8824462890625, 5.102294921875, 5.3221435546875, 5.5419921875, 5.7618408203125, 5.981689453125, 6.2015380859375, 6.42138671875, 6.6412353515625, 6.861083984375, 7.0809326171875, 7.30078125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 10.0, 4.0, 10.0, 18.0, 12.0, 18.0, 30.0, 43.0, 43.0, 55.0, 64.0, 93.0, 131.0, 204.0, 345.0, 569.0, 1324.0, 5668.0, 34841.0, 259560.0, 630966.0, 95610.0, 14120.0, 2693.0, 825.0, 389.0, 244.0, 175.0, 140.0, 85.0, 42.0, 54.0, 47.0, 23.0, 18.0, 15.0, 13.0, 14.0, 6.0, 14.0, 5.0, 4.0, 5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4921875, -13.060546875, -12.62890625, -12.197265625, -11.765625, -11.333984375, -10.90234375, -10.470703125, -10.0390625, -9.607421875, -9.17578125, -8.744140625, -8.3125, -7.880859375, -7.44921875, -7.017578125, -6.5859375, -6.154296875, -5.72265625, -5.291015625, -4.859375, -4.427734375, -3.99609375, -3.564453125, -3.1328125, -2.701171875, -2.26953125, -1.837890625, -1.40625, -0.974609375, -0.54296875, -0.111328125, 0.3203125, 0.751953125, 1.18359375, 1.615234375, 2.046875, 2.478515625, 2.91015625, 3.341796875, 3.7734375, 4.205078125, 4.63671875, 5.068359375, 5.5, 5.931640625, 6.36328125, 6.794921875, 7.2265625, 7.658203125, 8.08984375, 8.521484375, 8.953125, 9.384765625, 9.81640625, 10.248046875, 10.6796875, 11.111328125, 11.54296875, 11.974609375, 12.40625, 12.837890625, 13.26953125, 13.701171875, 14.1328125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 6.0, 4.0, 3.0, 10.0, 13.0, 13.0, 19.0, 27.0, 24.0, 33.0, 35.0, 37.0, 55.0, 53.0, 48.0, 70.0, 144.0, 1521.0, 404.0, 116.0, 70.0, 53.0, 46.0, 43.0, 28.0, 32.0, 25.0, 30.0, 24.0, 17.0, 13.0, 9.0, 5.0, 6.0, 1.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.25, -27.3916015625, -26.533203125, -25.6748046875, -24.81640625, -23.9580078125, -23.099609375, -22.2412109375, -21.3828125, -20.5244140625, -19.666015625, -18.8076171875, -17.94921875, -17.0908203125, -16.232421875, -15.3740234375, -14.515625, -13.6572265625, -12.798828125, -11.9404296875, -11.08203125, -10.2236328125, -9.365234375, -8.5068359375, -7.6484375, -6.7900390625, -5.931640625, -5.0732421875, -4.21484375, -3.3564453125, -2.498046875, -1.6396484375, -0.78125, 0.0771484375, 0.935546875, 1.7939453125, 2.65234375, 3.5107421875, 4.369140625, 5.2275390625, 6.0859375, 6.9443359375, 7.802734375, 8.6611328125, 9.51953125, 10.3779296875, 11.236328125, 12.0947265625, 12.953125, 13.8115234375, 14.669921875, 15.5283203125, 16.38671875, 17.2451171875, 18.103515625, 18.9619140625, 19.8203125, 20.6787109375, 21.537109375, 22.3955078125, 23.25390625, 24.1123046875, 24.970703125, 25.8291015625, 26.6875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 7.0, 1.0, 3.0, 9.0, 10.0, 17.0, 20.0, 27.0, 32.0, 39.0, 45.0, 66.0, 103.0, 139.0, 238.0, 613.0, 2780.0, 392421.0, 2743109.0, 4347.0, 765.0, 297.0, 182.0, 115.0, 72.0, 54.0, 40.0, 36.0, 35.0, 22.0, 15.0, 12.0, 10.0, 4.0, 2.0, 7.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-61.25, -59.2802734375, -57.310546875, -55.3408203125, -53.37109375, -51.4013671875, -49.431640625, -47.4619140625, -45.4921875, -43.5224609375, -41.552734375, -39.5830078125, -37.61328125, -35.6435546875, -33.673828125, -31.7041015625, -29.734375, -27.7646484375, -25.794921875, -23.8251953125, -21.85546875, -19.8857421875, -17.916015625, -15.9462890625, -13.9765625, -12.0068359375, -10.037109375, -8.0673828125, -6.09765625, -4.1279296875, -2.158203125, -0.1884765625, 1.78125, 3.7509765625, 5.720703125, 7.6904296875, 9.66015625, 11.6298828125, 13.599609375, 15.5693359375, 17.5390625, 19.5087890625, 21.478515625, 23.4482421875, 25.41796875, 27.3876953125, 29.357421875, 31.3271484375, 33.296875, 35.2666015625, 37.236328125, 39.2060546875, 41.17578125, 43.1455078125, 45.115234375, 47.0849609375, 49.0546875, 51.0244140625, 52.994140625, 54.9638671875, 56.93359375, 58.9033203125, 60.873046875, 62.8427734375, 64.8125]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 91.0, 920.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-754.56494140625, -741.61279296875, -728.66064453125, -715.70849609375, -702.7562866210938, -689.8041381835938, -676.8519897460938, -663.8998413085938, -650.9476928710938, -637.9955444335938, -625.0433959960938, -612.0912475585938, -599.1390380859375, -586.1868896484375, -573.2347412109375, -560.2825927734375, -547.3304443359375, -534.3782958984375, -521.4261474609375, -508.4739685058594, -495.5218200683594, -482.56964111328125, -469.61749267578125, -456.66534423828125, -443.7131652832031, -430.7610168457031, -417.808837890625, -404.856689453125, -391.904541015625, -378.952392578125, -366.0002136230469, -353.0480651855469, -340.09588623046875, -327.14373779296875, -314.1915588378906, -301.2394104003906, -288.2872619628906, -275.3350830078125, -262.3829345703125, -249.4307861328125, -236.4786376953125, -223.52647399902344, -210.57432556152344, -197.62216186523438, -184.67001342773438, -171.7178497314453, -158.76568603515625, -145.81353759765625, -132.86138916015625, -119.90923309326172, -106.95707702636719, -94.00491333007812, -81.05276489257812, -68.10060119628906, -55.14844512939453, -42.1962890625, -29.244125366210938, -16.291969299316406, -3.339811325073242, 9.612346649169922, 22.564502716064453, 35.51666259765625, 48.46881866455078, 61.42097473144531, 74.37313079833984]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 6.0, 8.0, 10.0, 9.0, 8.0, 14.0, 12.0, 13.0, 14.0, 7.0, 15.0, 19.0, 23.0, 27.0, 21.0, 24.0, 29.0, 37.0, 45.0, 53.0, 39.0, 46.0, 39.0, 38.0, 32.0, 41.0, 22.0, 37.0, 46.0, 25.0, 22.0, 26.0, 22.0, 28.0, 24.0, 20.0, 16.0, 12.0, 15.0, 8.0, 9.0, 4.0, 10.0, 9.0, 7.0, 4.0, 5.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-60.9410400390625, -59.06630325317383, -57.19157028198242, -55.31683349609375, -53.442100524902344, -51.56736373901367, -49.692626953125, -47.817893981933594, -45.94315719604492, -44.06842041015625, -42.193687438964844, -40.31895065307617, -38.444217681884766, -36.569480895996094, -34.69474792480469, -32.820011138916016, -30.945276260375977, -29.070541381835938, -27.1958065032959, -25.32107162475586, -23.446334838867188, -21.57159996032715, -19.69686508178711, -17.822128295898438, -15.947394371032715, -14.072659492492676, -12.19792366027832, -10.323188781738281, -8.448453903198242, -6.573718070983887, -4.698983192443848, -2.824247360229492, -0.9495124816894531, 0.9252227544784546, 2.7999579906463623, 4.6746931076049805, 6.549428462982178, 8.424163818359375, 10.298898696899414, 12.17363452911377, 14.048369407653809, 15.923104286193848, 17.797840118408203, 19.672574996948242, 21.54730987548828, 23.422046661376953, 25.29677963256836, 27.17151641845703, 29.04625129699707, 30.92098617553711, 32.79572296142578, 34.67045593261719, 36.54519271850586, 38.41992950439453, 40.29466247558594, 42.16939926147461, 44.044132232666016, 45.91886901855469, 47.793601989746094, 49.668338775634766, 51.54307174682617, 53.417808532714844, 55.29254150390625, 57.16727828979492, 59.042015075683594]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 3.0, 7.0, 2.0, 12.0, 11.0, 8.0, 19.0, 14.0, 17.0, 19.0, 25.0, 27.0, 28.0, 31.0, 28.0, 35.0, 31.0, 25.0, 30.0, 46.0, 42.0, 39.0, 30.0, 30.0, 51.0, 32.0, 27.0, 38.0, 34.0, 39.0, 31.0, 24.0, 24.0, 25.0, 15.0, 20.0, 10.0, 17.0, 16.0, 10.0, 7.0, 9.0, 3.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-7.8828125, -7.65179443359375, -7.4207763671875, -7.18975830078125, -6.958740234375, -6.72772216796875, -6.4967041015625, -6.26568603515625, -6.03466796875, -5.80364990234375, -5.5726318359375, -5.34161376953125, -5.110595703125, -4.87957763671875, -4.6485595703125, -4.41754150390625, -4.1865234375, -3.95550537109375, -3.7244873046875, -3.49346923828125, -3.262451171875, -3.03143310546875, -2.8004150390625, -2.56939697265625, -2.33837890625, -2.10736083984375, -1.8763427734375, -1.64532470703125, -1.414306640625, -1.18328857421875, -0.9522705078125, -0.72125244140625, -0.490234375, -0.25921630859375, -0.0281982421875, 0.20281982421875, 0.433837890625, 0.66485595703125, 0.8958740234375, 1.12689208984375, 1.35791015625, 1.58892822265625, 1.8199462890625, 2.05096435546875, 2.281982421875, 2.51300048828125, 2.7440185546875, 2.97503662109375, 3.2060546875, 3.43707275390625, 3.6680908203125, 3.89910888671875, 4.130126953125, 4.36114501953125, 4.5921630859375, 4.82318115234375, 5.05419921875, 5.28521728515625, 5.5162353515625, 5.74725341796875, 5.978271484375, 6.20928955078125, 6.4403076171875, 6.67132568359375, 6.90234375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 7.0, 8.0, 8.0, 14.0, 8.0, 19.0, 11.0, 25.0, 28.0, 34.0, 30.0, 51.0, 59.0, 106.0, 156.0, 265.0, 657.0, 1986.0, 11185.0, 166957.0, 2748699.0, 1211384.0, 45161.0, 5109.0, 1203.0, 434.0, 197.0, 132.0, 71.0, 59.0, 46.0, 33.0, 27.0, 10.0, 14.0, 25.0, 14.0, 15.0, 8.0, 3.0, 8.0, 2.0, 6.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-22.59375, -21.90478515625, -21.2158203125, -20.52685546875, -19.837890625, -19.14892578125, -18.4599609375, -17.77099609375, -17.08203125, -16.39306640625, -15.7041015625, -15.01513671875, -14.326171875, -13.63720703125, -12.9482421875, -12.25927734375, -11.5703125, -10.88134765625, -10.1923828125, -9.50341796875, -8.814453125, -8.12548828125, -7.4365234375, -6.74755859375, -6.05859375, -5.36962890625, -4.6806640625, -3.99169921875, -3.302734375, -2.61376953125, -1.9248046875, -1.23583984375, -0.546875, 0.14208984375, 0.8310546875, 1.52001953125, 2.208984375, 2.89794921875, 3.5869140625, 4.27587890625, 4.96484375, 5.65380859375, 6.3427734375, 7.03173828125, 7.720703125, 8.40966796875, 9.0986328125, 9.78759765625, 10.4765625, 11.16552734375, 11.8544921875, 12.54345703125, 13.232421875, 13.92138671875, 14.6103515625, 15.29931640625, 15.98828125, 16.67724609375, 17.3662109375, 18.05517578125, 18.744140625, 19.43310546875, 20.1220703125, 20.81103515625, 21.5]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 9.0, 6.0, 11.0, 19.0, 46.0, 61.0, 93.0, 173.0, 267.0, 424.0, 680.0, 750.0, 670.0, 368.0, 223.0, 124.0, 58.0, 44.0, 19.0, 11.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.46875, -15.794677734375, -15.12060546875, -14.446533203125, -13.7724609375, -13.098388671875, -12.42431640625, -11.750244140625, -11.076171875, -10.402099609375, -9.72802734375, -9.053955078125, -8.3798828125, -7.705810546875, -7.03173828125, -6.357666015625, -5.68359375, -5.009521484375, -4.33544921875, -3.661376953125, -2.9873046875, -2.313232421875, -1.63916015625, -0.965087890625, -0.291015625, 0.383056640625, 1.05712890625, 1.731201171875, 2.4052734375, 3.079345703125, 3.75341796875, 4.427490234375, 5.1015625, 5.775634765625, 6.44970703125, 7.123779296875, 7.7978515625, 8.471923828125, 9.14599609375, 9.820068359375, 10.494140625, 11.168212890625, 11.84228515625, 12.516357421875, 13.1904296875, 13.864501953125, 14.53857421875, 15.212646484375, 15.88671875, 16.560791015625, 17.23486328125, 17.908935546875, 18.5830078125, 19.257080078125, 19.93115234375, 20.605224609375, 21.279296875, 21.953369140625, 22.62744140625, 23.301513671875, 23.9755859375, 24.649658203125, 25.32373046875, 25.997802734375, 26.671875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 6.0, 3.0, 8.0, 10.0, 17.0, 13.0, 27.0, 46.0, 53.0, 75.0, 105.0, 186.0, 270.0, 531.0, 1596.0, 20703.0, 3998150.0, 167419.0, 3098.0, 841.0, 381.0, 216.0, 128.0, 109.0, 71.0, 52.0, 44.0, 33.0, 31.0, 11.0, 14.0, 10.0, 12.0, 6.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.8125, -64.82958984375, -62.8466796875, -60.86376953125, -58.880859375, -56.89794921875, -54.9150390625, -52.93212890625, -50.94921875, -48.96630859375, -46.9833984375, -45.00048828125, -43.017578125, -41.03466796875, -39.0517578125, -37.06884765625, -35.0859375, -33.10302734375, -31.1201171875, -29.13720703125, -27.154296875, -25.17138671875, -23.1884765625, -21.20556640625, -19.22265625, -17.23974609375, -15.2568359375, -13.27392578125, -11.291015625, -9.30810546875, -7.3251953125, -5.34228515625, -3.359375, -1.37646484375, 0.6064453125, 2.58935546875, 4.572265625, 6.55517578125, 8.5380859375, 10.52099609375, 12.50390625, 14.48681640625, 16.4697265625, 18.45263671875, 20.435546875, 22.41845703125, 24.4013671875, 26.38427734375, 28.3671875, 30.35009765625, 32.3330078125, 34.31591796875, 36.298828125, 38.28173828125, 40.2646484375, 42.24755859375, 44.23046875, 46.21337890625, 48.1962890625, 50.17919921875, 52.162109375, 54.14501953125, 56.1279296875, 58.11083984375, 60.09375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 20.0, 71.0, 192.0, 302.0, 254.0, 116.0, 39.0, 10.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.89653015136719, -105.12991333007812, -101.36328887939453, -97.59666442871094, -93.83004760742188, -90.06343078613281, -86.29680633544922, -82.53018188476562, -78.76356506347656, -74.9969482421875, -71.2303237915039, -67.46369934082031, -63.69708251953125, -59.93046188354492, -56.163841247558594, -52.397220611572266, -48.63059997558594, -44.86397933959961, -41.09735870361328, -37.33073806762695, -33.564117431640625, -29.797496795654297, -26.03087615966797, -22.26425552368164, -18.497634887695312, -14.731014251708984, -10.964393615722656, -7.197772979736328, -3.43115234375, 0.3354682922363281, 4.102088928222656, 7.868709564208984, 11.635330200195312, 15.40195083618164, 19.16857147216797, 22.935192108154297, 26.701812744140625, 30.468433380126953, 34.23505401611328, 38.00167465209961, 41.76829528808594, 45.534915924072266, 49.301536560058594, 53.06815719604492, 56.83477783203125, 60.60139846801758, 64.3680191040039, 68.1346435546875, 71.90126037597656, 75.66787719726562, 79.43450164794922, 83.20112609863281, 86.96774291992188, 90.73435974121094, 94.50098419189453, 98.26760864257812, 102.03422546386719, 105.80084228515625, 109.56746673583984, 113.33409118652344, 117.1007080078125, 120.86732482910156, 124.63394927978516, 128.40057373046875, 132.1671905517578]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 8.0, 7.0, 3.0, 7.0, 8.0, 14.0, 14.0, 20.0, 14.0, 27.0, 39.0, 19.0, 39.0, 35.0, 34.0, 27.0, 34.0, 40.0, 37.0, 34.0, 30.0, 42.0, 41.0, 52.0, 40.0, 31.0, 42.0, 32.0, 32.0, 31.0, 28.0, 28.0, 17.0, 15.0, 17.0, 10.0, 12.0, 12.0, 8.0, 8.0, 10.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-55.50042724609375, -53.971534729003906, -52.44264221191406, -50.91374969482422, -49.384857177734375, -47.8559684753418, -46.32707595825195, -44.79818344116211, -43.269290924072266, -41.74039840698242, -40.21150588989258, -38.682613372802734, -37.153724670410156, -35.62483215332031, -34.09593963623047, -32.567047119140625, -31.03815460205078, -29.509262084960938, -27.980369567871094, -26.451478958129883, -24.92258644104004, -23.393693923950195, -21.864803314208984, -20.33591079711914, -18.807018280029297, -17.278125762939453, -15.749234199523926, -14.220342636108398, -12.691450119018555, -11.162557601928711, -9.633666038513184, -8.104774475097656, -6.5758819580078125, -5.046989917755127, -3.5180978775024414, -1.9892058372497559, -0.4603137969970703, 1.0685782432556152, 2.597470283508301, 4.126361846923828, 5.655254364013672, 7.184146404266357, 8.713038444519043, 10.24193000793457, 11.770822525024414, 13.299715042114258, 14.828606605529785, 16.357498168945312, 17.886390686035156, 19.415283203125, 20.944175720214844, 22.473066329956055, 24.0019588470459, 25.530851364135742, 27.059741973876953, 28.588634490966797, 30.11752700805664, 31.646419525146484, 33.17531204223633, 34.70420455932617, 36.23309326171875, 37.761985778808594, 39.29087829589844, 40.81977081298828, 42.348663330078125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 1.0, 1.0, 4.0, 3.0, 13.0, 8.0, 10.0, 9.0, 10.0, 12.0, 18.0, 13.0, 21.0, 31.0, 12.0, 36.0, 34.0, 28.0, 43.0, 32.0, 37.0, 45.0, 43.0, 46.0, 42.0, 41.0, 28.0, 25.0, 45.0, 34.0, 40.0, 32.0, 38.0, 25.0, 25.0, 21.0, 18.0, 15.0, 8.0, 10.0, 7.0, 9.0, 8.0, 9.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.21875, -7.9610595703125, -7.703369140625, -7.4456787109375, -7.18798828125, -6.9302978515625, -6.672607421875, -6.4149169921875, -6.1572265625, -5.8995361328125, -5.641845703125, -5.3841552734375, -5.12646484375, -4.8687744140625, -4.611083984375, -4.3533935546875, -4.095703125, -3.8380126953125, -3.580322265625, -3.3226318359375, -3.06494140625, -2.8072509765625, -2.549560546875, -2.2918701171875, -2.0341796875, -1.7764892578125, -1.518798828125, -1.2611083984375, -1.00341796875, -0.7457275390625, -0.488037109375, -0.2303466796875, 0.02734375, 0.2850341796875, 0.542724609375, 0.8004150390625, 1.05810546875, 1.3157958984375, 1.573486328125, 1.8311767578125, 2.0888671875, 2.3465576171875, 2.604248046875, 2.8619384765625, 3.11962890625, 3.3773193359375, 3.635009765625, 3.8927001953125, 4.150390625, 4.4080810546875, 4.665771484375, 4.9234619140625, 5.18115234375, 5.4388427734375, 5.696533203125, 5.9542236328125, 6.2119140625, 6.4696044921875, 6.727294921875, 6.9849853515625, 7.24267578125, 7.5003662109375, 7.758056640625, 8.0157470703125, 8.2734375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 2.0, 5.0, 3.0, 7.0, 15.0, 31.0, 56.0, 59.0, 95.0, 172.0, 330.0, 462.0, 691.0, 1147.0, 1883.0, 2610.0, 3845.0, 6139.0, 9251.0, 14902.0, 23639.0, 39135.0, 67971.0, 128711.0, 323789.0, 198228.0, 91920.0, 51326.0, 30286.0, 18441.0, 11706.0, 7545.0, 4951.0, 3105.0, 2169.0, 1485.0, 845.0, 629.0, 391.0, 239.0, 132.0, 67.0, 52.0, 45.0, 17.0, 14.0, 5.0, 8.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.78515625, -1.7289276123046875, -1.672698974609375, -1.6164703369140625, -1.56024169921875, -1.5040130615234375, -1.447784423828125, -1.3915557861328125, -1.3353271484375, -1.2790985107421875, -1.222869873046875, -1.1666412353515625, -1.11041259765625, -1.0541839599609375, -0.997955322265625, -0.9417266845703125, -0.885498046875, -0.8292694091796875, -0.773040771484375, -0.7168121337890625, -0.66058349609375, -0.6043548583984375, -0.548126220703125, -0.4918975830078125, -0.4356689453125, -0.3794403076171875, -0.323211669921875, -0.2669830322265625, -0.21075439453125, -0.1545257568359375, -0.098297119140625, -0.0420684814453125, 0.01416015625, 0.0703887939453125, 0.126617431640625, 0.1828460693359375, 0.23907470703125, 0.2953033447265625, 0.351531982421875, 0.4077606201171875, 0.4639892578125, 0.5202178955078125, 0.576446533203125, 0.6326751708984375, 0.68890380859375, 0.7451324462890625, 0.801361083984375, 0.8575897216796875, 0.913818359375, 0.9700469970703125, 1.026275634765625, 1.0825042724609375, 1.13873291015625, 1.1949615478515625, 1.251190185546875, 1.3074188232421875, 1.3636474609375, 1.4198760986328125, 1.476104736328125, 1.5323333740234375, 1.58856201171875, 1.6447906494140625, 1.701019287109375, 1.7572479248046875, 1.8134765625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 2.0, 2.0, 6.0, 6.0, 7.0, 12.0, 9.0, 8.0, 10.0, 13.0, 12.0, 14.0, 27.0, 27.0, 29.0, 24.0, 31.0, 30.0, 31.0, 28.0, 34.0, 26.0, 37.0, 44.0, 38.0, 1058.0, 36.0, 36.0, 35.0, 32.0, 29.0, 32.0, 18.0, 46.0, 36.0, 27.0, 18.0, 24.0, 15.0, 13.0, 8.0, 14.0, 6.0, 9.0, 6.0, 5.0, 4.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.63671875, -4.4876708984375, -4.338623046875, -4.1895751953125, -4.04052734375, -3.8914794921875, -3.742431640625, -3.5933837890625, -3.4443359375, -3.2952880859375, -3.146240234375, -2.9971923828125, -2.84814453125, -2.6990966796875, -2.550048828125, -2.4010009765625, -2.251953125, -2.1029052734375, -1.953857421875, -1.8048095703125, -1.65576171875, -1.5067138671875, -1.357666015625, -1.2086181640625, -1.0595703125, -0.9105224609375, -0.761474609375, -0.6124267578125, -0.46337890625, -0.3143310546875, -0.165283203125, -0.0162353515625, 0.1328125, 0.2818603515625, 0.430908203125, 0.5799560546875, 0.72900390625, 0.8780517578125, 1.027099609375, 1.1761474609375, 1.3251953125, 1.4742431640625, 1.623291015625, 1.7723388671875, 1.92138671875, 2.0704345703125, 2.219482421875, 2.3685302734375, 2.517578125, 2.6666259765625, 2.815673828125, 2.9647216796875, 3.11376953125, 3.2628173828125, 3.411865234375, 3.5609130859375, 3.7099609375, 3.8590087890625, 4.008056640625, 4.1571044921875, 4.30615234375, 4.4552001953125, 4.604248046875, 4.7532958984375, 4.90234375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 7.0, 3.0, 6.0, 13.0, 11.0, 25.0, 23.0, 56.0, 97.0, 186.0, 294.0, 481.0, 858.0, 1468.0, 2394.0, 4346.0, 7859.0, 14600.0, 27496.0, 55093.0, 113796.0, 1397938.0, 271321.0, 97749.0, 47687.0, 24425.0, 12795.0, 6999.0, 3865.0, 2147.0, 1234.0, 768.0, 437.0, 251.0, 154.0, 85.0, 48.0, 29.0, 16.0, 7.0, 15.0, 11.0, 8.0, 7.0, 7.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0], "bins": [-2.380859375, -2.308502197265625, -2.23614501953125, -2.163787841796875, -2.0914306640625, -2.019073486328125, -1.94671630859375, -1.874359130859375, -1.802001953125, -1.729644775390625, -1.65728759765625, -1.584930419921875, -1.5125732421875, -1.440216064453125, -1.36785888671875, -1.295501708984375, -1.22314453125, -1.150787353515625, -1.07843017578125, -1.006072998046875, -0.9337158203125, -0.861358642578125, -0.78900146484375, -0.716644287109375, -0.644287109375, -0.571929931640625, -0.49957275390625, -0.427215576171875, -0.3548583984375, -0.282501220703125, -0.21014404296875, -0.137786865234375, -0.0654296875, 0.006927490234375, 0.07928466796875, 0.151641845703125, 0.2239990234375, 0.296356201171875, 0.36871337890625, 0.441070556640625, 0.513427734375, 0.585784912109375, 0.65814208984375, 0.730499267578125, 0.8028564453125, 0.875213623046875, 0.94757080078125, 1.019927978515625, 1.09228515625, 1.164642333984375, 1.23699951171875, 1.309356689453125, 1.3817138671875, 1.454071044921875, 1.52642822265625, 1.598785400390625, 1.671142578125, 1.743499755859375, 1.81585693359375, 1.888214111328125, 1.9605712890625, 2.032928466796875, 2.10528564453125, 2.177642822265625, 2.25]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 8.0, 5.0, 3.0, 4.0, 5.0, 8.0, 10.0, 18.0, 24.0, 30.0, 34.0, 54.0, 75.0, 77.0, 94.0, 120.0, 100.0, 74.0, 69.0, 56.0, 29.0, 18.0, 14.0, 15.0, 20.0, 7.0, 12.0, 4.0, 4.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001308441162109375, -0.001266777515411377, -0.001225113868713379, -0.0011834502220153809, -0.0011417865753173828, -0.0011001229286193848, -0.0010584592819213867, -0.0010167956352233887, -0.0009751319885253906, -0.0009334683418273926, -0.0008918046951293945, -0.0008501410484313965, -0.0008084774017333984, -0.0007668137550354004, -0.0007251501083374023, -0.0006834864616394043, -0.0006418228149414062, -0.0006001591682434082, -0.0005584955215454102, -0.0005168318748474121, -0.00047516822814941406, -0.000433504581451416, -0.00039184093475341797, -0.0003501772880554199, -0.0003085136413574219, -0.00026684999465942383, -0.00022518634796142578, -0.00018352270126342773, -0.0001418590545654297, -0.00010019540786743164, -5.8531761169433594e-05, -1.6868114471435547e-05, 2.47955322265625e-05, 6.645917892456055e-05, 0.0001081228256225586, 0.00014978647232055664, 0.0001914501190185547, 0.00023311376571655273, 0.0002747774124145508, 0.00031644105911254883, 0.0003581047058105469, 0.0003997683525085449, 0.00044143199920654297, 0.000483095645904541, 0.0005247592926025391, 0.0005664229393005371, 0.0006080865859985352, 0.0006497502326965332, 0.0006914138793945312, 0.0007330775260925293, 0.0007747411727905273, 0.0008164048194885254, 0.0008580684661865234, 0.0008997321128845215, 0.0009413957595825195, 0.0009830594062805176, 0.0010247230529785156, 0.0010663866996765137, 0.0011080503463745117, 0.0011497139930725098, 0.0011913776397705078, 0.0012330412864685059, 0.001274704933166504, 0.001316368579864502, 0.0013580322265625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 1.0, 5.0, 1.0, 3.0, 3.0, 6.0, 11.0, 13.0, 15.0, 22.0, 25.0, 29.0, 31.0, 69.0, 101.0, 173.0, 397.0, 2014.0, 1039939.0, 4672.0, 453.0, 216.0, 107.0, 72.0, 42.0, 39.0, 19.0, 16.0, 12.0, 11.0, 12.0, 8.0, 4.0, 5.0, 4.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02935791015625, -0.028428316116333008, -0.027498722076416016, -0.026569128036499023, -0.02563953399658203, -0.02470993995666504, -0.023780345916748047, -0.022850751876831055, -0.021921157836914062, -0.02099156379699707, -0.020061969757080078, -0.019132375717163086, -0.018202781677246094, -0.0172731876373291, -0.01634359359741211, -0.015413999557495117, -0.014484405517578125, -0.013554811477661133, -0.01262521743774414, -0.011695623397827148, -0.010766029357910156, -0.009836435317993164, -0.008906841278076172, -0.00797724723815918, -0.0070476531982421875, -0.006118059158325195, -0.005188465118408203, -0.004258871078491211, -0.0033292770385742188, -0.0023996829986572266, -0.0014700889587402344, -0.0005404949188232422, 0.00038909912109375, 0.0013186931610107422, 0.0022482872009277344, 0.0031778812408447266, 0.004107475280761719, 0.005037069320678711, 0.005966663360595703, 0.006896257400512695, 0.007825851440429688, 0.00875544548034668, 0.009685039520263672, 0.010614633560180664, 0.011544227600097656, 0.012473821640014648, 0.01340341567993164, 0.014333009719848633, 0.015262603759765625, 0.016192197799682617, 0.01712179183959961, 0.0180513858795166, 0.018980979919433594, 0.019910573959350586, 0.020840167999267578, 0.02176976203918457, 0.022699356079101562, 0.023628950119018555, 0.024558544158935547, 0.02548813819885254, 0.02641773223876953, 0.027347326278686523, 0.028276920318603516, 0.029206514358520508, 0.0301361083984375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 13.0, 48.0, 153.0, 274.0, 327.0, 135.0, 41.0, 15.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007776532438583672, -0.0007317668059840798, -0.0006858803099021316, -0.0006399938720278442, -0.0005941074341535568, -0.0005482209962792695, -0.0005023345584049821, -0.0004564480623230338, -0.00041056162444874644, -0.0003646751865744591, -0.00031878871959634125, -0.00027290225261822343, -0.00022701581474393606, -0.00018112936231773347, -0.00013524290989153087, -8.935644291341305e-05, -4.347000503912568e-05, 2.4164473870769143e-06, 4.830289981327951e-05, 9.41893522394821e-05, 0.0001400758046656847, 0.0001859622570918873, 0.0002318487095180899, 0.0002777351764962077, 0.0003236216143704951, 0.00036950805224478245, 0.00041539451922290027, 0.0004612809862010181, 0.0005071674240753055, 0.0005530538619495928, 0.0005989402998238802, 0.0006448267959058285, 0.0006907132919877768, 0.0007365997298620641, 0.0007824861677363515, 0.0008283726638182998, 0.0008742591016925871, 0.0009201455395668745, 0.0009660320356488228, 0.001011918531730771, 0.0010578049113973975, 0.0011036914074793458, 0.0011495777871459723, 0.0011954642832279205, 0.0012413507793098688, 0.0012872371589764953, 0.0013331236550584435, 0.00137901003472507, 0.0014248965308070183, 0.0014707830268889666, 0.001516669406555593, 0.0015625559026375413, 0.0016084422823041677, 0.001654328778386116, 0.0017002152744680643, 0.0017461017705500126, 0.001791988150216639, 0.0018378746462985873, 0.0018837610259652138, 0.001929647522047162, 0.0019755340181291103, 0.0020214205142110586, 0.0020673067774623632, 0.0021131932735443115, 0.00215907976962626]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 6.0, 7.0, 6.0, 4.0, 8.0, 13.0, 8.0, 14.0, 19.0, 9.0, 18.0, 23.0, 21.0, 28.0, 36.0, 35.0, 25.0, 45.0, 44.0, 43.0, 43.0, 35.0, 39.0, 42.0, 30.0, 55.0, 40.0, 27.0, 46.0, 30.0, 27.0, 24.0, 22.0, 22.0, 22.0, 17.0, 13.0, 12.0, 11.0, 6.0, 7.0, 7.0, 2.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0005258321762084961, -0.0005100676789879799, -0.0004943031817674637, -0.0004785386845469475, -0.0004627741873264313, -0.00044700969010591507, -0.00043124519288539886, -0.00041548069566488266, -0.00039971619844436646, -0.00038395170122385025, -0.00036818720400333405, -0.00035242270678281784, -0.00033665820956230164, -0.00032089371234178543, -0.0003051292151212692, -0.000289364717900753, -0.0002736002206802368, -0.0002578357234597206, -0.0002420712262392044, -0.0002263067290186882, -0.000210542231798172, -0.0001947777345776558, -0.0001790132373571396, -0.00016324874013662338, -0.00014748424291610718, -0.00013171974569559097, -0.00011595524847507477, -0.00010019075125455856, -8.442625403404236e-05, -6.866175681352615e-05, -5.289725959300995e-05, -3.7132762372493744e-05, -2.136826515197754e-05, -5.603767931461334e-06, 1.016072928905487e-05, 2.5925226509571075e-05, 4.168972373008728e-05, 5.7454220950603485e-05, 7.321871817111969e-05, 8.89832153916359e-05, 0.0001047477126121521, 0.0001205122098326683, 0.0001362767070531845, 0.00015204120427370071, 0.00016780570149421692, 0.00018357019871473312, 0.00019933469593524933, 0.00021509919315576553, 0.00023086369037628174, 0.00024662818759679794, 0.00026239268481731415, 0.00027815718203783035, 0.00029392167925834656, 0.00030968617647886276, 0.00032545067369937897, 0.00034121517091989517, 0.0003569796681404114, 0.0003727441653609276, 0.0003885086625814438, 0.00040427315980196, 0.0004200376570224762, 0.0004358021542429924, 0.0004515666514635086, 0.0004673311486840248, 0.000483095645904541]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 2.0, 1.0, 1.0, 4.0, 3.0, 13.0, 8.0, 10.0, 9.0, 10.0, 12.0, 18.0, 13.0, 21.0, 31.0, 12.0, 36.0, 34.0, 28.0, 43.0, 32.0, 37.0, 45.0, 43.0, 46.0, 42.0, 41.0, 28.0, 25.0, 45.0, 34.0, 40.0, 32.0, 38.0, 25.0, 25.0, 21.0, 18.0, 15.0, 8.0, 10.0, 7.0, 9.0, 8.0, 9.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.21875, -7.9610595703125, -7.703369140625, -7.4456787109375, -7.18798828125, -6.9302978515625, -6.672607421875, -6.4149169921875, -6.1572265625, -5.8995361328125, -5.641845703125, -5.3841552734375, -5.12646484375, -4.8687744140625, -4.611083984375, -4.3533935546875, -4.095703125, -3.8380126953125, -3.580322265625, -3.3226318359375, -3.06494140625, -2.8072509765625, -2.549560546875, -2.2918701171875, -2.0341796875, -1.7764892578125, -1.518798828125, -1.2611083984375, -1.00341796875, -0.7457275390625, -0.488037109375, -0.2303466796875, 0.02734375, 0.2850341796875, 0.542724609375, 0.8004150390625, 1.05810546875, 1.3157958984375, 1.573486328125, 1.8311767578125, 2.0888671875, 2.3465576171875, 2.604248046875, 2.8619384765625, 3.11962890625, 3.3773193359375, 3.635009765625, 3.8927001953125, 4.150390625, 4.4080810546875, 4.665771484375, 4.9234619140625, 5.18115234375, 5.4388427734375, 5.696533203125, 5.9542236328125, 6.2119140625, 6.4696044921875, 6.727294921875, 6.9849853515625, 7.24267578125, 7.5003662109375, 7.758056640625, 8.0157470703125, 8.2734375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 4.0, 4.0, 4.0, 6.0, 9.0, 17.0, 18.0, 19.0, 26.0, 22.0, 32.0, 46.0, 67.0, 77.0, 117.0, 156.0, 208.0, 291.0, 374.0, 516.0, 701.0, 1289.0, 4880.0, 41246.0, 754339.0, 221993.0, 16228.0, 2548.0, 934.0, 594.0, 442.0, 353.0, 247.0, 175.0, 162.0, 93.0, 71.0, 71.0, 36.0, 24.0, 26.0, 18.0, 23.0, 13.0, 13.0, 13.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.625, -19.976318359375, -19.32763671875, -18.678955078125, -18.0302734375, -17.381591796875, -16.73291015625, -16.084228515625, -15.435546875, -14.786865234375, -14.13818359375, -13.489501953125, -12.8408203125, -12.192138671875, -11.54345703125, -10.894775390625, -10.24609375, -9.597412109375, -8.94873046875, -8.300048828125, -7.6513671875, -7.002685546875, -6.35400390625, -5.705322265625, -5.056640625, -4.407958984375, -3.75927734375, -3.110595703125, -2.4619140625, -1.813232421875, -1.16455078125, -0.515869140625, 0.1328125, 0.781494140625, 1.43017578125, 2.078857421875, 2.7275390625, 3.376220703125, 4.02490234375, 4.673583984375, 5.322265625, 5.970947265625, 6.61962890625, 7.268310546875, 7.9169921875, 8.565673828125, 9.21435546875, 9.863037109375, 10.51171875, 11.160400390625, 11.80908203125, 12.457763671875, 13.1064453125, 13.755126953125, 14.40380859375, 15.052490234375, 15.701171875, 16.349853515625, 16.99853515625, 17.647216796875, 18.2958984375, 18.944580078125, 19.59326171875, 20.241943359375, 20.890625]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 8.0, 7.0, 12.0, 8.0, 6.0, 10.0, 13.0, 15.0, 22.0, 25.0, 36.0, 23.0, 43.0, 41.0, 42.0, 49.0, 42.0, 68.0, 150.0, 1663.0, 285.0, 90.0, 53.0, 40.0, 36.0, 30.0, 20.0, 35.0, 29.0, 24.0, 22.0, 15.0, 12.0, 17.0, 16.0, 9.0, 3.0, 6.0, 4.0, 4.0, 3.0, 1.0, 3.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-26.53125, -25.720947265625, -24.91064453125, -24.100341796875, -23.2900390625, -22.479736328125, -21.66943359375, -20.859130859375, -20.048828125, -19.238525390625, -18.42822265625, -17.617919921875, -16.8076171875, -15.997314453125, -15.18701171875, -14.376708984375, -13.56640625, -12.756103515625, -11.94580078125, -11.135498046875, -10.3251953125, -9.514892578125, -8.70458984375, -7.894287109375, -7.083984375, -6.273681640625, -5.46337890625, -4.653076171875, -3.8427734375, -3.032470703125, -2.22216796875, -1.411865234375, -0.6015625, 0.208740234375, 1.01904296875, 1.829345703125, 2.6396484375, 3.449951171875, 4.26025390625, 5.070556640625, 5.880859375, 6.691162109375, 7.50146484375, 8.311767578125, 9.1220703125, 9.932373046875, 10.74267578125, 11.552978515625, 12.36328125, 13.173583984375, 13.98388671875, 14.794189453125, 15.6044921875, 16.414794921875, 17.22509765625, 18.035400390625, 18.845703125, 19.656005859375, 20.46630859375, 21.276611328125, 22.0869140625, 22.897216796875, 23.70751953125, 24.517822265625, 25.328125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 1.0, 7.0, 6.0, 4.0, 7.0, 9.0, 19.0, 13.0, 14.0, 27.0, 21.0, 32.0, 40.0, 39.0, 57.0, 72.0, 127.0, 297.0, 877.0, 10057.0, 3119841.0, 12348.0, 888.0, 315.0, 133.0, 96.0, 62.0, 59.0, 49.0, 38.0, 26.0, 19.0, 19.0, 14.0, 14.0, 8.0, 9.0, 11.0, 8.0, 4.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-71.625, -69.3525390625, -67.080078125, -64.8076171875, -62.53515625, -60.2626953125, -57.990234375, -55.7177734375, -53.4453125, -51.1728515625, -48.900390625, -46.6279296875, -44.35546875, -42.0830078125, -39.810546875, -37.5380859375, -35.265625, -32.9931640625, -30.720703125, -28.4482421875, -26.17578125, -23.9033203125, -21.630859375, -19.3583984375, -17.0859375, -14.8134765625, -12.541015625, -10.2685546875, -7.99609375, -5.7236328125, -3.451171875, -1.1787109375, 1.09375, 3.3662109375, 5.638671875, 7.9111328125, 10.18359375, 12.4560546875, 14.728515625, 17.0009765625, 19.2734375, 21.5458984375, 23.818359375, 26.0908203125, 28.36328125, 30.6357421875, 32.908203125, 35.1806640625, 37.453125, 39.7255859375, 41.998046875, 44.2705078125, 46.54296875, 48.8154296875, 51.087890625, 53.3603515625, 55.6328125, 57.9052734375, 60.177734375, 62.4501953125, 64.72265625, 66.9951171875, 69.267578125, 71.5400390625, 73.8125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 56.0, 411.0, 439.0, 97.0, 9.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.17729949951172, -62.878875732421875, -59.5804557800293, -56.28203201293945, -52.983612060546875, -49.68518829345703, -46.38676452636719, -43.088340759277344, -39.789920806884766, -36.49149703979492, -33.193077087402344, -29.8946533203125, -26.59623146057129, -23.297809600830078, -19.999385833740234, -16.700963973999023, -13.402542114257812, -10.104120254516602, -6.805697441101074, -3.507274627685547, -0.20885276794433594, 3.089569091796875, 6.387992858886719, 9.68641471862793, 12.98483657836914, 16.28325843811035, 19.581680297851562, 22.880104064941406, 26.178525924682617, 29.476947784423828, 32.77537155151367, 36.07379150390625, 39.37220764160156, 42.670631408691406, 45.969051361083984, 49.26747512817383, 52.565895080566406, 55.86431884765625, 59.162742614746094, 62.46116638183594, 65.75958251953125, 69.0580062866211, 72.35643005371094, 75.65484619140625, 78.9532699584961, 82.25169372558594, 85.55011749267578, 88.84854125976562, 92.14696502685547, 95.44538879394531, 98.74381256103516, 102.042236328125, 105.34065246582031, 108.63907623291016, 111.9375, 115.23592376708984, 118.53434753417969, 121.83277130126953, 125.13119506835938, 128.4296112060547, 131.72804260253906, 135.02645874023438, 138.32489013671875, 141.62330627441406, 144.92172241210938]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 2.0, 7.0, 8.0, 17.0, 10.0, 17.0, 16.0, 16.0, 22.0, 22.0, 24.0, 34.0, 40.0, 26.0, 34.0, 33.0, 46.0, 43.0, 38.0, 45.0, 27.0, 42.0, 38.0, 42.0, 50.0, 37.0, 34.0, 33.0, 31.0, 24.0, 22.0, 27.0, 14.0, 21.0, 7.0, 6.0, 9.0, 11.0, 7.0, 3.0, 3.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-78.02364349365234, -75.73953247070312, -73.45541381835938, -71.17129516601562, -68.8871841430664, -66.60307312011719, -64.31895446777344, -62.03483963012695, -59.75072479248047, -57.466609954833984, -55.1824951171875, -52.898380279541016, -50.61426544189453, -48.33015060424805, -46.04603576660156, -43.76192092895508, -41.477806091308594, -39.19369125366211, -36.909576416015625, -34.62546157836914, -32.341346740722656, -30.057231903076172, -27.773117065429688, -25.489002227783203, -23.20488739013672, -20.920772552490234, -18.63665771484375, -16.352542877197266, -14.068428039550781, -11.784313201904297, -9.500198364257812, -7.216083526611328, -4.9319610595703125, -2.647846221923828, -0.36373138427734375, 1.9203834533691406, 4.204498291015625, 6.488613128662109, 8.772727966308594, 11.056842803955078, 13.340957641601562, 15.625072479248047, 17.90918731689453, 20.193302154541016, 22.4774169921875, 24.761531829833984, 27.04564666748047, 29.329761505126953, 31.613876342773438, 33.89799118041992, 36.182106018066406, 38.46622085571289, 40.750335693359375, 43.03445053100586, 45.318565368652344, 47.60268020629883, 49.88679504394531, 52.1709098815918, 54.45502471923828, 56.739139556884766, 59.02325439453125, 61.307369232177734, 63.59148406982422, 65.87559509277344, 68.15971374511719]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 6.0, 1.0, 3.0, 4.0, 6.0, 9.0, 16.0, 15.0, 13.0, 8.0, 13.0, 16.0, 12.0, 19.0, 27.0, 31.0, 26.0, 36.0, 36.0, 41.0, 24.0, 31.0, 37.0, 51.0, 32.0, 37.0, 40.0, 35.0, 49.0, 32.0, 32.0, 33.0, 31.0, 29.0, 27.0, 24.0, 18.0, 15.0, 16.0, 9.0, 11.0, 10.0, 9.0, 7.0, 5.0, 6.0, 4.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.765625, -7.5189208984375, -7.272216796875, -7.0255126953125, -6.77880859375, -6.5321044921875, -6.285400390625, -6.0386962890625, -5.7919921875, -5.5452880859375, -5.298583984375, -5.0518798828125, -4.80517578125, -4.5584716796875, -4.311767578125, -4.0650634765625, -3.818359375, -3.5716552734375, -3.324951171875, -3.0782470703125, -2.83154296875, -2.5848388671875, -2.338134765625, -2.0914306640625, -1.8447265625, -1.5980224609375, -1.351318359375, -1.1046142578125, -0.85791015625, -0.6112060546875, -0.364501953125, -0.1177978515625, 0.12890625, 0.3756103515625, 0.622314453125, 0.8690185546875, 1.11572265625, 1.3624267578125, 1.609130859375, 1.8558349609375, 2.1025390625, 2.3492431640625, 2.595947265625, 2.8426513671875, 3.08935546875, 3.3360595703125, 3.582763671875, 3.8294677734375, 4.076171875, 4.3228759765625, 4.569580078125, 4.8162841796875, 5.06298828125, 5.3096923828125, 5.556396484375, 5.8031005859375, 6.0498046875, 6.2965087890625, 6.543212890625, 6.7899169921875, 7.03662109375, 7.2833251953125, 7.530029296875, 7.7767333984375, 8.0234375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 7.0, 10.0, 18.0, 7.0, 18.0, 25.0, 23.0, 34.0, 38.0, 55.0, 69.0, 89.0, 91.0, 136.0, 232.0, 278.0, 483.0, 867.0, 1790.0, 5296.0, 23320.0, 223293.0, 1982490.0, 1747332.0, 179771.0, 19651.0, 4804.0, 1723.0, 777.0, 431.0, 286.0, 222.0, 122.0, 109.0, 72.0, 58.0, 60.0, 38.0, 40.0, 30.0, 13.0, 13.0, 10.0, 10.0, 11.0, 11.0, 4.0, 7.0, 5.0, 1.0, 1.0, 1.0, 4.0], "bins": [-18.03125, -17.500244140625, -16.96923828125, -16.438232421875, -15.9072265625, -15.376220703125, -14.84521484375, -14.314208984375, -13.783203125, -13.252197265625, -12.72119140625, -12.190185546875, -11.6591796875, -11.128173828125, -10.59716796875, -10.066162109375, -9.53515625, -9.004150390625, -8.47314453125, -7.942138671875, -7.4111328125, -6.880126953125, -6.34912109375, -5.818115234375, -5.287109375, -4.756103515625, -4.22509765625, -3.694091796875, -3.1630859375, -2.632080078125, -2.10107421875, -1.570068359375, -1.0390625, -0.508056640625, 0.02294921875, 0.553955078125, 1.0849609375, 1.615966796875, 2.14697265625, 2.677978515625, 3.208984375, 3.739990234375, 4.27099609375, 4.802001953125, 5.3330078125, 5.864013671875, 6.39501953125, 6.926025390625, 7.45703125, 7.988037109375, 8.51904296875, 9.050048828125, 9.5810546875, 10.112060546875, 10.64306640625, 11.174072265625, 11.705078125, 12.236083984375, 12.76708984375, 13.298095703125, 13.8291015625, 14.360107421875, 14.89111328125, 15.422119140625, 15.953125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 7.0, 20.0, 40.0, 67.0, 124.0, 267.0, 470.0, 912.0, 958.0, 588.0, 317.0, 143.0, 76.0, 36.0, 18.0, 14.0, 7.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.625, -21.7919921875, -20.958984375, -20.1259765625, -19.29296875, -18.4599609375, -17.626953125, -16.7939453125, -15.9609375, -15.1279296875, -14.294921875, -13.4619140625, -12.62890625, -11.7958984375, -10.962890625, -10.1298828125, -9.296875, -8.4638671875, -7.630859375, -6.7978515625, -5.96484375, -5.1318359375, -4.298828125, -3.4658203125, -2.6328125, -1.7998046875, -0.966796875, -0.1337890625, 0.69921875, 1.5322265625, 2.365234375, 3.1982421875, 4.03125, 4.8642578125, 5.697265625, 6.5302734375, 7.36328125, 8.1962890625, 9.029296875, 9.8623046875, 10.6953125, 11.5283203125, 12.361328125, 13.1943359375, 14.02734375, 14.8603515625, 15.693359375, 16.5263671875, 17.359375, 18.1923828125, 19.025390625, 19.8583984375, 20.69140625, 21.5244140625, 22.357421875, 23.1904296875, 24.0234375, 24.8564453125, 25.689453125, 26.5224609375, 27.35546875, 28.1884765625, 29.021484375, 29.8544921875, 30.6875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 9.0, 3.0, 13.0, 8.0, 19.0, 33.0, 49.0, 88.0, 146.0, 251.0, 573.0, 1789.0, 22820.0, 4082070.0, 82197.0, 2633.0, 754.0, 317.0, 200.0, 130.0, 56.0, 39.0, 31.0, 17.0, 9.0, 15.0, 11.0, 8.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.75, -90.4091796875, -88.068359375, -85.7275390625, -83.38671875, -81.0458984375, -78.705078125, -76.3642578125, -74.0234375, -71.6826171875, -69.341796875, -67.0009765625, -64.66015625, -62.3193359375, -59.978515625, -57.6376953125, -55.296875, -52.9560546875, -50.615234375, -48.2744140625, -45.93359375, -43.5927734375, -41.251953125, -38.9111328125, -36.5703125, -34.2294921875, -31.888671875, -29.5478515625, -27.20703125, -24.8662109375, -22.525390625, -20.1845703125, -17.84375, -15.5029296875, -13.162109375, -10.8212890625, -8.48046875, -6.1396484375, -3.798828125, -1.4580078125, 0.8828125, 3.2236328125, 5.564453125, 7.9052734375, 10.24609375, 12.5869140625, 14.927734375, 17.2685546875, 19.609375, 21.9501953125, 24.291015625, 26.6318359375, 28.97265625, 31.3134765625, 33.654296875, 35.9951171875, 38.3359375, 40.6767578125, 43.017578125, 45.3583984375, 47.69921875, 50.0400390625, 52.380859375, 54.7216796875, 57.0625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 161.0, 670.0, 168.0, 9.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.97335815429688, -121.28545379638672, -111.59754943847656, -101.90965270996094, -92.22174072265625, -82.53384399414062, -72.84593963623047, -63.15803527832031, -53.470130920410156, -43.7822265625, -34.094322204589844, -24.406421661376953, -14.718517303466797, -5.030612945556641, 4.65728759765625, 14.345191955566406, 24.033096313476562, 33.72100067138672, 43.408905029296875, 53.096805572509766, 62.78470993041992, 72.47261047363281, 82.16051483154297, 91.84841918945312, 101.53632354736328, 111.22422790527344, 120.9121322631836, 130.60003662109375, 140.28793334960938, 149.97584533691406, 159.6637420654297, 169.35165405273438, 179.03955078125, 188.72744750976562, 198.4153594970703, 208.10325622558594, 217.79116821289062, 227.47906494140625, 237.16696166992188, 246.85487365722656, 256.54278564453125, 266.2306823730469, 275.9185791015625, 285.60650634765625, 295.2944030761719, 304.9822998046875, 314.6701965332031, 324.35809326171875, 334.0460205078125, 343.7339172363281, 353.42181396484375, 363.1097412109375, 372.7976379394531, 382.48553466796875, 392.1734313964844, 401.861328125, 411.5492248535156, 421.23712158203125, 430.9250183105469, 440.6129455566406, 450.30084228515625, 459.9887390136719, 469.6766357421875, 479.36456298828125, 489.0524597167969]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 6.0, 8.0, 9.0, 13.0, 10.0, 12.0, 11.0, 21.0, 22.0, 34.0, 29.0, 28.0, 33.0, 44.0, 45.0, 48.0, 41.0, 36.0, 38.0, 32.0, 39.0, 26.0, 33.0, 44.0, 43.0, 31.0, 37.0, 29.0, 29.0, 24.0, 24.0, 16.0, 18.0, 9.0, 15.0, 8.0, 9.0, 4.0, 3.0, 8.0, 6.0, 3.0, 7.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-46.9952392578125, -45.60688018798828, -44.21852111816406, -42.83015823364258, -41.44179916381836, -40.05344009399414, -38.665077209472656, -37.27671813964844, -35.88835906982422, -34.5, -33.11164093017578, -31.723278045654297, -30.334918975830078, -28.94655990600586, -27.558198928833008, -26.169837951660156, -24.781478881835938, -23.39311981201172, -22.004758834838867, -20.616397857666016, -19.228038787841797, -17.839679718017578, -16.451318740844727, -15.062958717346191, -13.674598693847656, -12.286238670349121, -10.897878646850586, -9.50951862335205, -8.121158599853516, -6.7327985763549805, -5.344438552856445, -3.95607852935791, -2.567718505859375, -1.1793584823608398, 0.2090015411376953, 1.5973615646362305, 2.9857215881347656, 4.374081611633301, 5.762441635131836, 7.150801658630371, 8.539161682128906, 9.927521705627441, 11.315881729125977, 12.704241752624512, 14.092601776123047, 15.480961799621582, 16.869321823120117, 18.25768280029297, 19.646041870117188, 21.034400939941406, 22.422761917114258, 23.81112289428711, 25.199481964111328, 26.587841033935547, 27.9762020111084, 29.36456298828125, 30.75292205810547, 32.14128112792969, 33.529640197753906, 34.91800308227539, 36.30636215209961, 37.69472122192383, 39.08308410644531, 40.47144317626953, 41.85980224609375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 3.0, 9.0, 7.0, 4.0, 10.0, 9.0, 9.0, 16.0, 12.0, 12.0, 18.0, 25.0, 24.0, 22.0, 26.0, 30.0, 20.0, 40.0, 29.0, 32.0, 28.0, 32.0, 43.0, 38.0, 42.0, 39.0, 38.0, 40.0, 35.0, 34.0, 17.0, 28.0, 30.0, 24.0, 29.0, 20.0, 26.0, 10.0, 16.0, 15.0, 15.0, 6.0, 8.0, 5.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0], "bins": [-7.74609375, -7.50042724609375, -7.2547607421875, -7.00909423828125, -6.763427734375, -6.51776123046875, -6.2720947265625, -6.02642822265625, -5.78076171875, -5.53509521484375, -5.2894287109375, -5.04376220703125, -4.798095703125, -4.55242919921875, -4.3067626953125, -4.06109619140625, -3.8154296875, -3.56976318359375, -3.3240966796875, -3.07843017578125, -2.832763671875, -2.58709716796875, -2.3414306640625, -2.09576416015625, -1.85009765625, -1.60443115234375, -1.3587646484375, -1.11309814453125, -0.867431640625, -0.62176513671875, -0.3760986328125, -0.13043212890625, 0.115234375, 0.36090087890625, 0.6065673828125, 0.85223388671875, 1.097900390625, 1.34356689453125, 1.5892333984375, 1.83489990234375, 2.08056640625, 2.32623291015625, 2.5718994140625, 2.81756591796875, 3.063232421875, 3.30889892578125, 3.5545654296875, 3.80023193359375, 4.0458984375, 4.29156494140625, 4.5372314453125, 4.78289794921875, 5.028564453125, 5.27423095703125, 5.5198974609375, 5.76556396484375, 6.01123046875, 6.25689697265625, 6.5025634765625, 6.74822998046875, 6.993896484375, 7.23956298828125, 7.4852294921875, 7.73089599609375, 7.9765625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 13.0, 11.0, 22.0, 37.0, 43.0, 71.0, 122.0, 171.0, 281.0, 373.0, 594.0, 781.0, 1164.0, 1565.0, 2287.0, 3177.0, 4763.0, 6929.0, 10045.0, 14872.0, 22257.0, 33498.0, 51990.0, 85401.0, 168423.0, 304367.0, 128644.0, 71504.0, 44649.0, 29252.0, 19268.0, 13339.0, 8919.0, 6181.0, 4191.0, 2845.0, 1959.0, 1402.0, 941.0, 702.0, 482.0, 338.0, 230.0, 150.0, 109.0, 66.0, 56.0, 30.0, 16.0, 9.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0], "bins": [-1.583984375, -1.5334320068359375, -1.482879638671875, -1.4323272705078125, -1.38177490234375, -1.3312225341796875, -1.280670166015625, -1.2301177978515625, -1.1795654296875, -1.1290130615234375, -1.078460693359375, -1.0279083251953125, -0.97735595703125, -0.9268035888671875, -0.876251220703125, -0.8256988525390625, -0.775146484375, -0.7245941162109375, -0.674041748046875, -0.6234893798828125, -0.57293701171875, -0.5223846435546875, -0.471832275390625, -0.4212799072265625, -0.3707275390625, -0.3201751708984375, -0.269622802734375, -0.2190704345703125, -0.16851806640625, -0.1179656982421875, -0.067413330078125, -0.0168609619140625, 0.03369140625, 0.0842437744140625, 0.134796142578125, 0.1853485107421875, 0.23590087890625, 0.2864532470703125, 0.337005615234375, 0.3875579833984375, 0.4381103515625, 0.4886627197265625, 0.539215087890625, 0.5897674560546875, 0.64031982421875, 0.6908721923828125, 0.741424560546875, 0.7919769287109375, 0.842529296875, 0.8930816650390625, 0.943634033203125, 0.9941864013671875, 1.04473876953125, 1.0952911376953125, 1.145843505859375, 1.1963958740234375, 1.2469482421875, 1.2975006103515625, 1.348052978515625, 1.3986053466796875, 1.44915771484375, 1.4997100830078125, 1.550262451171875, 1.6008148193359375, 1.6513671875]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 9.0, 8.0, 13.0, 9.0, 9.0, 8.0, 12.0, 19.0, 18.0, 16.0, 19.0, 33.0, 36.0, 23.0, 32.0, 34.0, 25.0, 23.0, 37.0, 36.0, 37.0, 1063.0, 46.0, 42.0, 38.0, 48.0, 33.0, 32.0, 26.0, 26.0, 28.0, 38.0, 20.0, 28.0, 20.0, 16.0, 6.0, 22.0, 9.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.33984375, -5.17303466796875, -5.0062255859375, -4.83941650390625, -4.672607421875, -4.50579833984375, -4.3389892578125, -4.17218017578125, -4.00537109375, -3.83856201171875, -3.6717529296875, -3.50494384765625, -3.338134765625, -3.17132568359375, -3.0045166015625, -2.83770751953125, -2.6708984375, -2.50408935546875, -2.3372802734375, -2.17047119140625, -2.003662109375, -1.83685302734375, -1.6700439453125, -1.50323486328125, -1.33642578125, -1.16961669921875, -1.0028076171875, -0.83599853515625, -0.669189453125, -0.50238037109375, -0.3355712890625, -0.16876220703125, -0.001953125, 0.16485595703125, 0.3316650390625, 0.49847412109375, 0.665283203125, 0.83209228515625, 0.9989013671875, 1.16571044921875, 1.33251953125, 1.49932861328125, 1.6661376953125, 1.83294677734375, 1.999755859375, 2.16656494140625, 2.3333740234375, 2.50018310546875, 2.6669921875, 2.83380126953125, 3.0006103515625, 3.16741943359375, 3.334228515625, 3.50103759765625, 3.6678466796875, 3.83465576171875, 4.00146484375, 4.16827392578125, 4.3350830078125, 4.50189208984375, 4.668701171875, 4.83551025390625, 5.0023193359375, 5.16912841796875, 5.3359375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 6.0, 5.0, 28.0, 20.0, 24.0, 65.0, 100.0, 161.0, 281.0, 421.0, 821.0, 1411.0, 2448.0, 4618.0, 8440.0, 16553.0, 31896.0, 64926.0, 144889.0, 1471936.0, 190546.0, 77769.0, 38321.0, 19270.0, 10207.0, 5312.0, 2952.0, 1577.0, 844.0, 534.0, 290.0, 171.0, 89.0, 66.0, 36.0, 21.0, 15.0, 9.0, 16.0, 6.0, 9.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.552734375, -2.472015380859375, -2.39129638671875, -2.310577392578125, -2.2298583984375, -2.149139404296875, -2.06842041015625, -1.987701416015625, -1.906982421875, -1.826263427734375, -1.74554443359375, -1.664825439453125, -1.5841064453125, -1.503387451171875, -1.42266845703125, -1.341949462890625, -1.26123046875, -1.180511474609375, -1.09979248046875, -1.019073486328125, -0.9383544921875, -0.857635498046875, -0.77691650390625, -0.696197509765625, -0.615478515625, -0.534759521484375, -0.45404052734375, -0.373321533203125, -0.2926025390625, -0.211883544921875, -0.13116455078125, -0.050445556640625, 0.0302734375, 0.110992431640625, 0.19171142578125, 0.272430419921875, 0.3531494140625, 0.433868408203125, 0.51458740234375, 0.595306396484375, 0.676025390625, 0.756744384765625, 0.83746337890625, 0.918182373046875, 0.9989013671875, 1.079620361328125, 1.16033935546875, 1.241058349609375, 1.32177734375, 1.402496337890625, 1.48321533203125, 1.563934326171875, 1.6446533203125, 1.725372314453125, 1.80609130859375, 1.886810302734375, 1.967529296875, 2.048248291015625, 2.12896728515625, 2.209686279296875, 2.2904052734375, 2.371124267578125, 2.45184326171875, 2.532562255859375, 2.61328125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 6.0, 6.0, 4.0, 3.0, 3.0, 5.0, 8.0, 11.0, 5.0, 13.0, 9.0, 14.0, 19.0, 22.0, 15.0, 24.0, 34.0, 32.0, 44.0, 49.0, 56.0, 59.0, 49.0, 61.0, 51.0, 68.0, 49.0, 46.0, 30.0, 36.0, 25.0, 23.0, 10.0, 25.0, 16.0, 11.0, 10.0, 9.0, 11.0, 5.0, 6.0, 4.0, 6.0, 3.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.001068115234375, -0.0010369420051574707, -0.0010057687759399414, -0.0009745955467224121, -0.0009434223175048828, -0.0009122490882873535, -0.0008810758590698242, -0.0008499026298522949, -0.0008187294006347656, -0.0007875561714172363, -0.000756382942199707, -0.0007252097129821777, -0.0006940364837646484, -0.0006628632545471191, -0.0006316900253295898, -0.0006005167961120605, -0.0005693435668945312, -0.000538170337677002, -0.0005069971084594727, -0.00047582387924194336, -0.00044465065002441406, -0.00041347742080688477, -0.00038230419158935547, -0.00035113096237182617, -0.0003199577331542969, -0.0002887845039367676, -0.0002576112747192383, -0.00022643804550170898, -0.0001952648162841797, -0.0001640915870666504, -0.0001329183578491211, -0.0001017451286315918, -7.05718994140625e-05, -3.93986701965332e-05, -8.225440979003906e-06, 2.294778823852539e-05, 5.412101745605469e-05, 8.529424667358398e-05, 0.00011646747589111328, 0.00014764070510864258, 0.00017881393432617188, 0.00020998716354370117, 0.00024116039276123047, 0.00027233362197875977, 0.00030350685119628906, 0.00033468008041381836, 0.00036585330963134766, 0.00039702653884887695, 0.00042819976806640625, 0.00045937299728393555, 0.0004905462265014648, 0.0005217194557189941, 0.0005528926849365234, 0.0005840659141540527, 0.000615239143371582, 0.0006464123725891113, 0.0006775856018066406, 0.0007087588310241699, 0.0007399320602416992, 0.0007711052894592285, 0.0008022785186767578, 0.0008334517478942871, 0.0008646249771118164, 0.0008957982063293457, 0.000926971435546875]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 3.0, 5.0, 6.0, 3.0, 7.0, 7.0, 8.0, 10.0, 17.0, 20.0, 34.0, 30.0, 28.0, 42.0, 50.0, 64.0, 93.0, 158.0, 225.0, 341.0, 763.0, 12378.0, 1024466.0, 7911.0, 716.0, 352.0, 217.0, 156.0, 95.0, 72.0, 45.0, 32.0, 34.0, 35.0, 22.0, 26.0, 12.0, 14.0, 10.0, 6.0, 10.0, 9.0, 3.0, 2.0, 8.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01947021484375, -0.018786191940307617, -0.018102169036865234, -0.01741814613342285, -0.01673412322998047, -0.016050100326538086, -0.015366077423095703, -0.01468205451965332, -0.013998031616210938, -0.013314008712768555, -0.012629985809326172, -0.011945962905883789, -0.011261940002441406, -0.010577917098999023, -0.00989389419555664, -0.009209871292114258, -0.008525848388671875, -0.007841825485229492, -0.007157802581787109, -0.0064737796783447266, -0.005789756774902344, -0.005105733871459961, -0.004421710968017578, -0.0037376880645751953, -0.0030536651611328125, -0.0023696422576904297, -0.0016856193542480469, -0.001001596450805664, -0.00031757354736328125, 0.00036644935607910156, 0.0010504722595214844, 0.0017344951629638672, 0.00241851806640625, 0.003102540969848633, 0.0037865638732910156, 0.0044705867767333984, 0.005154609680175781, 0.005838632583618164, 0.006522655487060547, 0.00720667839050293, 0.007890701293945312, 0.008574724197387695, 0.009258747100830078, 0.009942770004272461, 0.010626792907714844, 0.011310815811157227, 0.01199483871459961, 0.012678861618041992, 0.013362884521484375, 0.014046907424926758, 0.01473093032836914, 0.015414953231811523, 0.016098976135253906, 0.01678299903869629, 0.017467021942138672, 0.018151044845581055, 0.018835067749023438, 0.01951909065246582, 0.020203113555908203, 0.020887136459350586, 0.02157115936279297, 0.02225518226623535, 0.022939205169677734, 0.023623228073120117, 0.0243072509765625]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 10.0, 20.0, 114.0, 283.0, 307.0, 189.0, 71.0, 18.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010907640680670738, -0.0010342790046706796, -0.0009777940576896071, -0.0009213089942932129, -0.0008648239308968186, -0.0008083389257080853, -0.000751853920519352, -0.0006953688571229577, -0.0006388838519342244, -0.000582398846745491, -0.0005259137833490968, -0.00046942877816036344, -0.00041294374386779964, -0.00035645870957523584, -0.0002999737043865025, -0.0002434886700939387, -0.0001870036358013749, -0.00013051860150881112, -7.403358176816255e-05, -1.754856202751398e-05, 3.8936472265049815e-05, 9.542150655761361e-05, 0.00015190651174634695, 0.00020839154603891075, 0.00026487658033147454, 0.00032136161462403834, 0.00037784664891660213, 0.0004343316541053355, 0.0004908166592940688, 0.0005473017226904631, 0.0006037867278791964, 0.0006602717330679297, 0.000716756796464324, 0.0007732418016530573, 0.0008297268650494516, 0.0008862118702381849, 0.0009426969336345792, 0.0009991819970309734, 0.0010556669440120459, 0.0011121520074084401, 0.0011686370708048344, 0.0012251221342012286, 0.001281607081182301, 0.0013380921445786953, 0.0013945772079750896, 0.0014510622713714838, 0.0015075472183525562, 0.0015640322817489505, 0.001620517228730023, 0.0016770022921264172, 0.0017334872391074896, 0.0017899723025038838, 0.001846457365900278, 0.0019029423128813505, 0.001959427259862423, 0.002015912439674139, 0.0020723973866552114, 0.002128882333636284, 0.002185367513448, 0.0022418524604290724, 0.002298337407410145, 0.002354822587221861, 0.0024113075342029333, 0.0024677924811840057, 0.002524277660995722]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 4.0, 2.0, 10.0, 6.0, 13.0, 10.0, 9.0, 13.0, 19.0, 28.0, 21.0, 25.0, 24.0, 35.0, 26.0, 45.0, 42.0, 44.0, 51.0, 45.0, 50.0, 48.0, 40.0, 45.0, 42.0, 26.0, 43.0, 33.0, 28.0, 30.0, 31.0, 20.0, 13.0, 23.0, 17.0, 10.0, 5.0, 5.0, 10.0, 7.0, 0.0, 4.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0006924271583557129, -0.000672302208840847, -0.0006521772593259811, -0.0006320523098111153, -0.0006119273602962494, -0.0005918024107813835, -0.0005716774612665176, -0.0005515525117516518, -0.0005314275622367859, -0.00051130261272192, -0.0004911776632070541, -0.00047105271369218826, -0.0004509277641773224, -0.0004308028146624565, -0.00041067786514759064, -0.00039055291563272476, -0.0003704279661178589, -0.000350303016602993, -0.00033017806708812714, -0.00031005311757326126, -0.0002899281680583954, -0.0002698032185435295, -0.00024967826902866364, -0.00022955331951379776, -0.00020942836999893188, -0.000189303420484066, -0.00016917847096920013, -0.00014905352145433426, -0.00012892857193946838, -0.00010880362242460251, -8.867867290973663e-05, -6.855372339487076e-05, -4.842877388000488e-05, -2.8303824365139008e-05, -8.178874850273132e-06, 1.1946074664592743e-05, 3.207102417945862e-05, 5.2195973694324493e-05, 7.232092320919037e-05, 9.244587272405624e-05, 0.00011257082223892212, 0.000132695771753788, 0.00015282072126865387, 0.00017294567078351974, 0.00019307062029838562, 0.0002131955698132515, 0.00023332051932811737, 0.00025344546884298325, 0.0002735704183578491, 0.000293695367872715, 0.00031382031738758087, 0.00033394526690244675, 0.0003540702164173126, 0.0003741951659321785, 0.00039432011544704437, 0.00041444506496191025, 0.0004345700144767761, 0.000454694963991642, 0.0004748199135065079, 0.0004949448630213737, 0.0005150698125362396, 0.0005351947620511055, 0.0005553197115659714, 0.0005754446610808372, 0.0005955696105957031]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 3.0, 9.0, 7.0, 4.0, 10.0, 9.0, 9.0, 16.0, 12.0, 12.0, 18.0, 25.0, 24.0, 22.0, 26.0, 30.0, 20.0, 40.0, 29.0, 32.0, 28.0, 32.0, 43.0, 38.0, 42.0, 39.0, 38.0, 40.0, 35.0, 34.0, 17.0, 28.0, 30.0, 24.0, 29.0, 20.0, 26.0, 10.0, 16.0, 15.0, 15.0, 6.0, 8.0, 5.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0], "bins": [-7.74609375, -7.50042724609375, -7.2547607421875, -7.00909423828125, -6.763427734375, -6.51776123046875, -6.2720947265625, -6.02642822265625, -5.78076171875, -5.53509521484375, -5.2894287109375, -5.04376220703125, -4.798095703125, -4.55242919921875, -4.3067626953125, -4.06109619140625, -3.8154296875, -3.56976318359375, -3.3240966796875, -3.07843017578125, -2.832763671875, -2.58709716796875, -2.3414306640625, -2.09576416015625, -1.85009765625, -1.60443115234375, -1.3587646484375, -1.11309814453125, -0.867431640625, -0.62176513671875, -0.3760986328125, -0.13043212890625, 0.115234375, 0.36090087890625, 0.6065673828125, 0.85223388671875, 1.097900390625, 1.34356689453125, 1.5892333984375, 1.83489990234375, 2.08056640625, 2.32623291015625, 2.5718994140625, 2.81756591796875, 3.063232421875, 3.30889892578125, 3.5545654296875, 3.80023193359375, 4.0458984375, 4.29156494140625, 4.5372314453125, 4.78289794921875, 5.028564453125, 5.27423095703125, 5.5198974609375, 5.76556396484375, 6.01123046875, 6.25689697265625, 6.5025634765625, 6.74822998046875, 6.993896484375, 7.23956298828125, 7.4852294921875, 7.73089599609375, 7.9765625]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 8.0, 7.0, 8.0, 6.0, 21.0, 13.0, 21.0, 25.0, 33.0, 35.0, 45.0, 45.0, 69.0, 87.0, 77.0, 132.0, 208.0, 302.0, 504.0, 1047.0, 2022.0, 4743.0, 11405.0, 30657.0, 88576.0, 301574.0, 411248.0, 126594.0, 42118.0, 15109.0, 5969.0, 2676.0, 1276.0, 604.0, 360.0, 246.0, 143.0, 123.0, 100.0, 76.0, 48.0, 50.0, 28.0, 25.0, 21.0, 14.0, 19.0, 9.0, 8.0, 10.0, 3.0, 4.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-9.8984375, -9.5806884765625, -9.262939453125, -8.9451904296875, -8.62744140625, -8.3096923828125, -7.991943359375, -7.6741943359375, -7.3564453125, -7.0386962890625, -6.720947265625, -6.4031982421875, -6.08544921875, -5.7677001953125, -5.449951171875, -5.1322021484375, -4.814453125, -4.4967041015625, -4.178955078125, -3.8612060546875, -3.54345703125, -3.2257080078125, -2.907958984375, -2.5902099609375, -2.2724609375, -1.9547119140625, -1.636962890625, -1.3192138671875, -1.00146484375, -0.6837158203125, -0.365966796875, -0.0482177734375, 0.26953125, 0.5872802734375, 0.905029296875, 1.2227783203125, 1.54052734375, 1.8582763671875, 2.176025390625, 2.4937744140625, 2.8115234375, 3.1292724609375, 3.447021484375, 3.7647705078125, 4.08251953125, 4.4002685546875, 4.718017578125, 5.0357666015625, 5.353515625, 5.6712646484375, 5.989013671875, 6.3067626953125, 6.62451171875, 6.9422607421875, 7.260009765625, 7.5777587890625, 7.8955078125, 8.2132568359375, 8.531005859375, 8.8487548828125, 9.16650390625, 9.4842529296875, 9.802001953125, 10.1197509765625, 10.4375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 6.0, 4.0, 5.0, 5.0, 6.0, 6.0, 12.0, 7.0, 11.0, 15.0, 15.0, 16.0, 20.0, 29.0, 23.0, 24.0, 43.0, 50.0, 47.0, 63.0, 97.0, 178.0, 1506.0, 269.0, 110.0, 73.0, 69.0, 36.0, 46.0, 43.0, 27.0, 28.0, 25.0, 20.0, 21.0, 17.0, 14.0, 16.0, 8.0, 7.0, 13.0, 7.0, 5.0, 10.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-24.921875, -24.159423828125, -23.39697265625, -22.634521484375, -21.8720703125, -21.109619140625, -20.34716796875, -19.584716796875, -18.822265625, -18.059814453125, -17.29736328125, -16.534912109375, -15.7724609375, -15.010009765625, -14.24755859375, -13.485107421875, -12.72265625, -11.960205078125, -11.19775390625, -10.435302734375, -9.6728515625, -8.910400390625, -8.14794921875, -7.385498046875, -6.623046875, -5.860595703125, -5.09814453125, -4.335693359375, -3.5732421875, -2.810791015625, -2.04833984375, -1.285888671875, -0.5234375, 0.239013671875, 1.00146484375, 1.763916015625, 2.5263671875, 3.288818359375, 4.05126953125, 4.813720703125, 5.576171875, 6.338623046875, 7.10107421875, 7.863525390625, 8.6259765625, 9.388427734375, 10.15087890625, 10.913330078125, 11.67578125, 12.438232421875, 13.20068359375, 13.963134765625, 14.7255859375, 15.488037109375, 16.25048828125, 17.012939453125, 17.775390625, 18.537841796875, 19.30029296875, 20.062744140625, 20.8251953125, 21.587646484375, 22.35009765625, 23.112548828125, 23.875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 11.0, 18.0, 17.0, 40.0, 40.0, 62.0, 92.0, 100.0, 151.0, 220.0, 321.0, 715.0, 3353.0, 109315.0, 2976530.0, 50908.0, 2218.0, 578.0, 320.0, 191.0, 135.0, 98.0, 65.0, 46.0, 39.0, 22.0, 20.0, 13.0, 16.0, 10.0, 6.0, 5.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-40.78125, -39.48291015625, -38.1845703125, -36.88623046875, -35.587890625, -34.28955078125, -32.9912109375, -31.69287109375, -30.39453125, -29.09619140625, -27.7978515625, -26.49951171875, -25.201171875, -23.90283203125, -22.6044921875, -21.30615234375, -20.0078125, -18.70947265625, -17.4111328125, -16.11279296875, -14.814453125, -13.51611328125, -12.2177734375, -10.91943359375, -9.62109375, -8.32275390625, -7.0244140625, -5.72607421875, -4.427734375, -3.12939453125, -1.8310546875, -0.53271484375, 0.765625, 2.06396484375, 3.3623046875, 4.66064453125, 5.958984375, 7.25732421875, 8.5556640625, 9.85400390625, 11.15234375, 12.45068359375, 13.7490234375, 15.04736328125, 16.345703125, 17.64404296875, 18.9423828125, 20.24072265625, 21.5390625, 22.83740234375, 24.1357421875, 25.43408203125, 26.732421875, 28.03076171875, 29.3291015625, 30.62744140625, 31.92578125, 33.22412109375, 34.5224609375, 35.82080078125, 37.119140625, 38.41748046875, 39.7158203125, 41.01416015625, 42.3125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 267.0, 603.0, 131.0, 7.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.729103088378906, -39.069000244140625, -34.408897399902344, -29.748796463012695, -25.088693618774414, -20.428590774536133, -15.768489837646484, -11.108386993408203, -6.448284149169922, -1.7881817817687988, 2.871920585632324, 7.532022476196289, 12.19212532043457, 16.85222816467285, 21.5123291015625, 26.17243194580078, 30.832534790039062, 35.492637634277344, 40.152740478515625, 44.812843322753906, 49.47294616699219, 54.13304901123047, 58.793148040771484, 63.453250885009766, 68.11335754394531, 72.7734603881836, 77.43356323242188, 82.09366607666016, 86.75376892089844, 91.41387176513672, 96.073974609375, 100.73406982421875, 105.39418029785156, 110.05428314208984, 114.71438598632812, 119.3744888305664, 124.03459167480469, 128.69468688964844, 133.35479736328125, 138.014892578125, 142.6750030517578, 147.33509826660156, 151.99520874023438, 156.65530395507812, 161.31541442871094, 165.9755096435547, 170.6356201171875, 175.29571533203125, 179.955810546875, 184.61590576171875, 189.27601623535156, 193.9361114501953, 198.59622192382812, 203.25631713867188, 207.9164276123047, 212.57652282714844, 217.23663330078125, 221.896728515625, 226.5568389892578, 231.21693420410156, 235.87704467773438, 240.53713989257812, 245.19725036621094, 249.8573455810547, 254.5174560546875]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 5.0, 9.0, 4.0, 16.0, 6.0, 16.0, 11.0, 25.0, 14.0, 23.0, 21.0, 29.0, 34.0, 30.0, 34.0, 35.0, 44.0, 41.0, 37.0, 45.0, 48.0, 34.0, 41.0, 28.0, 31.0, 44.0, 34.0, 27.0, 39.0, 30.0, 29.0, 15.0, 22.0, 9.0, 14.0, 13.0, 20.0, 12.0, 9.0, 6.0, 9.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-59.62049102783203, -57.90251541137695, -56.184539794921875, -54.46656036376953, -52.74858474731445, -51.030609130859375, -49.3126335144043, -47.59465789794922, -45.876678466796875, -44.1587028503418, -42.44072723388672, -40.722747802734375, -39.0047721862793, -37.28679656982422, -35.56882095336914, -33.85084533691406, -32.132869720458984, -30.414894104003906, -28.696916580200195, -26.978940963745117, -25.260963439941406, -23.542987823486328, -21.82501220703125, -20.107036590576172, -18.38905906677246, -16.671083450317383, -14.953105926513672, -13.235130310058594, -11.5171537399292, -9.799177169799805, -8.081201553344727, -6.363224983215332, -4.6452484130859375, -2.927272081375122, -1.2092957496643066, 0.5086803436279297, 2.226656913757324, 3.9446334838867188, 5.662609100341797, 7.380585670471191, 9.098562240600586, 10.81653881072998, 12.534515380859375, 14.252490997314453, 15.970467567443848, 17.688444137573242, 19.40641975402832, 21.12439727783203, 22.84237289428711, 24.560348510742188, 26.2783260345459, 27.996301651000977, 29.714279174804688, 31.432254791259766, 33.150230407714844, 34.86820602416992, 36.586181640625, 38.30415725708008, 40.022132873535156, 41.7401123046875, 43.45808792114258, 45.176063537597656, 46.894039154052734, 48.61201477050781, 50.329994201660156]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 8.0, 11.0, 5.0, 14.0, 15.0, 10.0, 13.0, 17.0, 22.0, 22.0, 16.0, 28.0, 21.0, 32.0, 25.0, 48.0, 34.0, 33.0, 38.0, 46.0, 24.0, 38.0, 36.0, 39.0, 36.0, 39.0, 32.0, 43.0, 36.0, 20.0, 23.0, 30.0, 21.0, 21.0, 17.0, 10.0, 12.0, 14.0, 9.0, 5.0, 6.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0], "bins": [-8.359375, -8.095703125, -7.83203125, -7.568359375, -7.3046875, -7.041015625, -6.77734375, -6.513671875, -6.25, -5.986328125, -5.72265625, -5.458984375, -5.1953125, -4.931640625, -4.66796875, -4.404296875, -4.140625, -3.876953125, -3.61328125, -3.349609375, -3.0859375, -2.822265625, -2.55859375, -2.294921875, -2.03125, -1.767578125, -1.50390625, -1.240234375, -0.9765625, -0.712890625, -0.44921875, -0.185546875, 0.078125, 0.341796875, 0.60546875, 0.869140625, 1.1328125, 1.396484375, 1.66015625, 1.923828125, 2.1875, 2.451171875, 2.71484375, 2.978515625, 3.2421875, 3.505859375, 3.76953125, 4.033203125, 4.296875, 4.560546875, 4.82421875, 5.087890625, 5.3515625, 5.615234375, 5.87890625, 6.142578125, 6.40625, 6.669921875, 6.93359375, 7.197265625, 7.4609375, 7.724609375, 7.98828125, 8.251953125, 8.515625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 2.0, 8.0, 9.0, 10.0, 6.0, 11.0, 13.0, 19.0, 21.0, 30.0, 45.0, 52.0, 80.0, 150.0, 259.0, 617.0, 1966.0, 9234.0, 157222.0, 2862354.0, 1122175.0, 33545.0, 4297.0, 1114.0, 447.0, 211.0, 97.0, 61.0, 48.0, 40.0, 29.0, 19.0, 16.0, 12.0, 10.0, 20.0, 7.0, 4.0, 3.0, 4.0, 2.0, 2.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0], "bins": [-28.359375, -27.566650390625, -26.77392578125, -25.981201171875, -25.1884765625, -24.395751953125, -23.60302734375, -22.810302734375, -22.017578125, -21.224853515625, -20.43212890625, -19.639404296875, -18.8466796875, -18.053955078125, -17.26123046875, -16.468505859375, -15.67578125, -14.883056640625, -14.09033203125, -13.297607421875, -12.5048828125, -11.712158203125, -10.91943359375, -10.126708984375, -9.333984375, -8.541259765625, -7.74853515625, -6.955810546875, -6.1630859375, -5.370361328125, -4.57763671875, -3.784912109375, -2.9921875, -2.199462890625, -1.40673828125, -0.614013671875, 0.1787109375, 0.971435546875, 1.76416015625, 2.556884765625, 3.349609375, 4.142333984375, 4.93505859375, 5.727783203125, 6.5205078125, 7.313232421875, 8.10595703125, 8.898681640625, 9.69140625, 10.484130859375, 11.27685546875, 12.069580078125, 12.8623046875, 13.655029296875, 14.44775390625, 15.240478515625, 16.033203125, 16.825927734375, 17.61865234375, 18.411376953125, 19.2041015625, 19.996826171875, 20.78955078125, 21.582275390625, 22.375]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 7.0, 6.0, 15.0, 14.0, 20.0, 30.0, 45.0, 56.0, 98.0, 167.0, 274.0, 351.0, 518.0, 598.0, 539.0, 453.0, 295.0, 190.0, 113.0, 84.0, 52.0, 39.0, 27.0, 18.0, 13.0, 8.0, 10.0, 13.0, 5.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-13.953125, -13.48388671875, -13.0146484375, -12.54541015625, -12.076171875, -11.60693359375, -11.1376953125, -10.66845703125, -10.19921875, -9.72998046875, -9.2607421875, -8.79150390625, -8.322265625, -7.85302734375, -7.3837890625, -6.91455078125, -6.4453125, -5.97607421875, -5.5068359375, -5.03759765625, -4.568359375, -4.09912109375, -3.6298828125, -3.16064453125, -2.69140625, -2.22216796875, -1.7529296875, -1.28369140625, -0.814453125, -0.34521484375, 0.1240234375, 0.59326171875, 1.0625, 1.53173828125, 2.0009765625, 2.47021484375, 2.939453125, 3.40869140625, 3.8779296875, 4.34716796875, 4.81640625, 5.28564453125, 5.7548828125, 6.22412109375, 6.693359375, 7.16259765625, 7.6318359375, 8.10107421875, 8.5703125, 9.03955078125, 9.5087890625, 9.97802734375, 10.447265625, 10.91650390625, 11.3857421875, 11.85498046875, 12.32421875, 12.79345703125, 13.2626953125, 13.73193359375, 14.201171875, 14.67041015625, 15.1396484375, 15.60888671875, 16.078125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 2.0, 7.0, 6.0, 22.0, 15.0, 18.0, 32.0, 57.0, 90.0, 149.0, 276.0, 670.0, 1868.0, 8836.0, 90830.0, 3258376.0, 794888.0, 31362.0, 4564.0, 1214.0, 478.0, 205.0, 111.0, 54.0, 38.0, 34.0, 23.0, 12.0, 8.0, 13.0, 7.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.515625, -24.486572265625, -23.45751953125, -22.428466796875, -21.3994140625, -20.370361328125, -19.34130859375, -18.312255859375, -17.283203125, -16.254150390625, -15.22509765625, -14.196044921875, -13.1669921875, -12.137939453125, -11.10888671875, -10.079833984375, -9.05078125, -8.021728515625, -6.99267578125, -5.963623046875, -4.9345703125, -3.905517578125, -2.87646484375, -1.847412109375, -0.818359375, 0.210693359375, 1.23974609375, 2.268798828125, 3.2978515625, 4.326904296875, 5.35595703125, 6.385009765625, 7.4140625, 8.443115234375, 9.47216796875, 10.501220703125, 11.5302734375, 12.559326171875, 13.58837890625, 14.617431640625, 15.646484375, 16.675537109375, 17.70458984375, 18.733642578125, 19.7626953125, 20.791748046875, 21.82080078125, 22.849853515625, 23.87890625, 24.907958984375, 25.93701171875, 26.966064453125, 27.9951171875, 29.024169921875, 30.05322265625, 31.082275390625, 32.111328125, 33.140380859375, 34.16943359375, 35.198486328125, 36.2275390625, 37.256591796875, 38.28564453125, 39.314697265625, 40.34375]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 15.0, 329.0, 558.0, 108.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.63906860351562, -63.900028228759766, -56.160987854003906, -48.42194747924805, -40.68290710449219, -32.94386672973633, -25.20482635498047, -17.46578598022461, -9.72674560546875, -1.9877052307128906, 5.751335144042969, 13.490375518798828, 21.229415893554688, 28.968456268310547, 36.707496643066406, 44.446537017822266, 52.185577392578125, 59.924617767333984, 67.66365814208984, 75.40269470214844, 83.14173889160156, 90.88078308105469, 98.61981964111328, 106.35885620117188, 114.097900390625, 121.83694458007812, 129.57598876953125, 137.3150177001953, 145.05406188964844, 152.79310607910156, 160.53213500976562, 168.27117919921875, 176.01022338867188, 183.749267578125, 191.48831176757812, 199.2273406982422, 206.9663848876953, 214.70542907714844, 222.4444580078125, 230.18350219726562, 237.92254638671875, 245.66159057617188, 253.400634765625, 261.1396789550781, 268.87872314453125, 276.61773681640625, 284.3567810058594, 292.0958251953125, 299.8348693847656, 307.57391357421875, 315.3129577636719, 323.052001953125, 330.791015625, 338.5300598144531, 346.26910400390625, 354.0081481933594, 361.7471923828125, 369.4862365722656, 377.22528076171875, 384.9643249511719, 392.703369140625, 400.4423828125, 408.1814270019531, 415.92047119140625, 423.6595153808594]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 7.0, 8.0, 4.0, 7.0, 11.0, 10.0, 11.0, 17.0, 25.0, 14.0, 26.0, 21.0, 27.0, 29.0, 24.0, 34.0, 44.0, 42.0, 32.0, 42.0, 35.0, 43.0, 33.0, 47.0, 36.0, 48.0, 50.0, 30.0, 29.0, 21.0, 23.0, 24.0, 21.0, 13.0, 19.0, 19.0, 13.0, 13.0, 9.0, 13.0, 6.0, 8.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.33027648925781, -37.00249481201172, -35.674713134765625, -34.3469352722168, -33.0191535949707, -31.69137191772461, -30.363590240478516, -29.035808563232422, -27.70802879333496, -26.380247116088867, -25.052467346191406, -23.724685668945312, -22.39690399169922, -21.069124221801758, -19.741342544555664, -18.413562774658203, -17.08578109741211, -15.758000373840332, -14.430219650268555, -13.102437973022461, -11.774657249450684, -10.446876525878906, -9.119094848632812, -7.791314125061035, -6.463533401489258, -5.1357526779174805, -3.807971477508545, -2.4801905155181885, -1.152409553527832, 0.1753711700439453, 1.5031523704528809, 2.8309335708618164, 4.158714294433594, 5.486495018005371, 6.814276218414307, 8.142057418823242, 9.46983814239502, 10.797618865966797, 12.12540054321289, 13.453181266784668, 14.780961990356445, 16.10874366760254, 17.4365234375, 18.764305114746094, 20.092086791992188, 21.41986656188965, 22.747648239135742, 24.075428009033203, 25.403209686279297, 26.73099136352539, 28.05877113342285, 29.386552810668945, 30.714332580566406, 32.0421142578125, 33.369895935058594, 34.69767761230469, 36.02545928955078, 37.353240966796875, 38.68102264404297, 40.0088005065918, 41.33658218383789, 42.664363861083984, 43.99214553833008, 45.31992721557617, 46.647705078125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 3.0, 5.0, 8.0, 8.0, 12.0, 16.0, 9.0, 10.0, 14.0, 16.0, 17.0, 19.0, 20.0, 21.0, 21.0, 18.0, 31.0, 43.0, 33.0, 38.0, 26.0, 30.0, 34.0, 27.0, 36.0, 36.0, 42.0, 27.0, 33.0, 23.0, 31.0, 33.0, 30.0, 22.0, 24.0, 27.0, 21.0, 16.0, 19.0, 19.0, 19.0, 13.0, 13.0, 4.0, 1.0, 5.0, 7.0, 6.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 4.0], "bins": [-8.0859375, -7.83544921875, -7.5849609375, -7.33447265625, -7.083984375, -6.83349609375, -6.5830078125, -6.33251953125, -6.08203125, -5.83154296875, -5.5810546875, -5.33056640625, -5.080078125, -4.82958984375, -4.5791015625, -4.32861328125, -4.078125, -3.82763671875, -3.5771484375, -3.32666015625, -3.076171875, -2.82568359375, -2.5751953125, -2.32470703125, -2.07421875, -1.82373046875, -1.5732421875, -1.32275390625, -1.072265625, -0.82177734375, -0.5712890625, -0.32080078125, -0.0703125, 0.18017578125, 0.4306640625, 0.68115234375, 0.931640625, 1.18212890625, 1.4326171875, 1.68310546875, 1.93359375, 2.18408203125, 2.4345703125, 2.68505859375, 2.935546875, 3.18603515625, 3.4365234375, 3.68701171875, 3.9375, 4.18798828125, 4.4384765625, 4.68896484375, 4.939453125, 5.18994140625, 5.4404296875, 5.69091796875, 5.94140625, 6.19189453125, 6.4423828125, 6.69287109375, 6.943359375, 7.19384765625, 7.4443359375, 7.69482421875, 7.9453125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [6.0, 5.0, 5.0, 5.0, 11.0, 22.0, 25.0, 39.0, 74.0, 86.0, 115.0, 173.0, 240.0, 319.0, 489.0, 624.0, 908.0, 1225.0, 1583.0, 2323.0, 3179.0, 4392.0, 5941.0, 8161.0, 11395.0, 15932.0, 23069.0, 33705.0, 50438.0, 78361.0, 138589.0, 270871.0, 145942.0, 81390.0, 51951.0, 34610.0, 23708.0, 16333.0, 11660.0, 8455.0, 6111.0, 4363.0, 3191.0, 2378.0, 1679.0, 1205.0, 946.0, 708.0, 453.0, 366.0, 236.0, 172.0, 147.0, 80.0, 59.0, 48.0, 28.0, 14.0, 14.0, 6.0, 4.0, 4.0, 2.0, 3.0], "bins": [-1.4287109375, -1.3834075927734375, -1.338104248046875, -1.2928009033203125, -1.24749755859375, -1.2021942138671875, -1.156890869140625, -1.1115875244140625, -1.0662841796875, -1.0209808349609375, -0.975677490234375, -0.9303741455078125, -0.88507080078125, -0.8397674560546875, -0.794464111328125, -0.7491607666015625, -0.703857421875, -0.6585540771484375, -0.613250732421875, -0.5679473876953125, -0.52264404296875, -0.4773406982421875, -0.432037353515625, -0.3867340087890625, -0.3414306640625, -0.2961273193359375, -0.250823974609375, -0.2055206298828125, -0.16021728515625, -0.1149139404296875, -0.069610595703125, -0.0243072509765625, 0.02099609375, 0.0662994384765625, 0.111602783203125, 0.1569061279296875, 0.20220947265625, 0.2475128173828125, 0.292816162109375, 0.3381195068359375, 0.3834228515625, 0.4287261962890625, 0.474029541015625, 0.5193328857421875, 0.56463623046875, 0.6099395751953125, 0.655242919921875, 0.7005462646484375, 0.745849609375, 0.7911529541015625, 0.836456298828125, 0.8817596435546875, 0.92706298828125, 0.9723663330078125, 1.017669677734375, 1.0629730224609375, 1.1082763671875, 1.1535797119140625, 1.198883056640625, 1.2441864013671875, 1.28948974609375, 1.3347930908203125, 1.380096435546875, 1.4253997802734375, 1.470703125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 2.0, 3.0, 3.0, 9.0, 12.0, 10.0, 8.0, 13.0, 23.0, 14.0, 28.0, 22.0, 19.0, 27.0, 23.0, 28.0, 33.0, 35.0, 28.0, 36.0, 39.0, 34.0, 44.0, 1068.0, 37.0, 47.0, 27.0, 41.0, 28.0, 29.0, 27.0, 29.0, 29.0, 23.0, 27.0, 14.0, 20.0, 19.0, 13.0, 8.0, 16.0, 10.0, 7.0, 8.0, 2.0, 6.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.03515625, -5.8477783203125, -5.660400390625, -5.4730224609375, -5.28564453125, -5.0982666015625, -4.910888671875, -4.7235107421875, -4.5361328125, -4.3487548828125, -4.161376953125, -3.9739990234375, -3.78662109375, -3.5992431640625, -3.411865234375, -3.2244873046875, -3.037109375, -2.8497314453125, -2.662353515625, -2.4749755859375, -2.28759765625, -2.1002197265625, -1.912841796875, -1.7254638671875, -1.5380859375, -1.3507080078125, -1.163330078125, -0.9759521484375, -0.78857421875, -0.6011962890625, -0.413818359375, -0.2264404296875, -0.0390625, 0.1483154296875, 0.335693359375, 0.5230712890625, 0.71044921875, 0.8978271484375, 1.085205078125, 1.2725830078125, 1.4599609375, 1.6473388671875, 1.834716796875, 2.0220947265625, 2.20947265625, 2.3968505859375, 2.584228515625, 2.7716064453125, 2.958984375, 3.1463623046875, 3.333740234375, 3.5211181640625, 3.70849609375, 3.8958740234375, 4.083251953125, 4.2706298828125, 4.4580078125, 4.6453857421875, 4.832763671875, 5.0201416015625, 5.20751953125, 5.3948974609375, 5.582275390625, 5.7696533203125, 5.95703125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 9.0, 6.0, 13.0, 16.0, 12.0, 28.0, 42.0, 55.0, 97.0, 198.0, 410.0, 733.0, 1408.0, 2639.0, 5163.0, 9819.0, 19096.0, 37219.0, 74532.0, 180411.0, 1486651.0, 145899.0, 64937.0, 32662.0, 16954.0, 8550.0, 4460.0, 2375.0, 1292.0, 617.0, 340.0, 186.0, 106.0, 63.0, 35.0, 28.0, 14.0, 11.0, 12.0, 10.0, 7.0, 3.0, 4.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.986328125, -2.8941650390625, -2.802001953125, -2.7098388671875, -2.61767578125, -2.5255126953125, -2.433349609375, -2.3411865234375, -2.2490234375, -2.1568603515625, -2.064697265625, -1.9725341796875, -1.88037109375, -1.7882080078125, -1.696044921875, -1.6038818359375, -1.51171875, -1.4195556640625, -1.327392578125, -1.2352294921875, -1.14306640625, -1.0509033203125, -0.958740234375, -0.8665771484375, -0.7744140625, -0.6822509765625, -0.590087890625, -0.4979248046875, -0.40576171875, -0.3135986328125, -0.221435546875, -0.1292724609375, -0.037109375, 0.0550537109375, 0.147216796875, 0.2393798828125, 0.33154296875, 0.4237060546875, 0.515869140625, 0.6080322265625, 0.7001953125, 0.7923583984375, 0.884521484375, 0.9766845703125, 1.06884765625, 1.1610107421875, 1.253173828125, 1.3453369140625, 1.4375, 1.5296630859375, 1.621826171875, 1.7139892578125, 1.80615234375, 1.8983154296875, 1.990478515625, 2.0826416015625, 2.1748046875, 2.2669677734375, 2.359130859375, 2.4512939453125, 2.54345703125, 2.6356201171875, 2.727783203125, 2.8199462890625, 2.912109375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 6.0, 6.0, 20.0, 18.0, 21.0, 31.0, 23.0, 65.0, 74.0, 75.0, 97.0, 99.0, 94.0, 79.0, 80.0, 46.0, 53.0, 30.0, 24.0, 14.0, 14.0, 8.0, 4.0, 6.0, 4.0, 6.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018854141235351562, -0.0018296539783477783, -0.0017738938331604004, -0.0017181336879730225, -0.0016623735427856445, -0.0016066133975982666, -0.0015508532524108887, -0.0014950931072235107, -0.0014393329620361328, -0.0013835728168487549, -0.001327812671661377, -0.001272052526473999, -0.001216292381286621, -0.0011605322360992432, -0.0011047720909118652, -0.0010490119457244873, -0.0009932518005371094, -0.0009374916553497314, -0.0008817315101623535, -0.0008259713649749756, -0.0007702112197875977, -0.0007144510746002197, -0.0006586909294128418, -0.0006029307842254639, -0.0005471706390380859, -0.000491410493850708, -0.0004356503486633301, -0.00037989020347595215, -0.0003241300582885742, -0.0002683699131011963, -0.00021260976791381836, -0.00015684962272644043, -0.0001010894775390625, -4.532933235168457e-05, 1.043081283569336e-05, 6.619095802307129e-05, 0.00012195110321044922, 0.00017771124839782715, 0.00023347139358520508, 0.000289231538772583, 0.00034499168395996094, 0.00040075182914733887, 0.0004565119743347168, 0.0005122721195220947, 0.0005680322647094727, 0.0006237924098968506, 0.0006795525550842285, 0.0007353127002716064, 0.0007910728454589844, 0.0008468329906463623, 0.0009025931358337402, 0.0009583532810211182, 0.001014113426208496, 0.001069873571395874, 0.001125633716583252, 0.0011813938617706299, 0.0012371540069580078, 0.0012929141521453857, 0.0013486742973327637, 0.0014044344425201416, 0.0014601945877075195, 0.0015159547328948975, 0.0015717148780822754, 0.0016274750232696533, 0.0016832351684570312]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 2.0, 9.0, 5.0, 10.0, 7.0, 19.0, 13.0, 18.0, 39.0, 40.0, 54.0, 84.0, 131.0, 207.0, 439.0, 1266.0, 1003830.0, 40671.0, 802.0, 338.0, 176.0, 118.0, 74.0, 53.0, 52.0, 28.0, 25.0, 16.0, 9.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.030426025390625, -0.02940511703491211, -0.02838420867919922, -0.027363300323486328, -0.026342391967773438, -0.025321483612060547, -0.024300575256347656, -0.023279666900634766, -0.022258758544921875, -0.021237850189208984, -0.020216941833496094, -0.019196033477783203, -0.018175125122070312, -0.017154216766357422, -0.01613330841064453, -0.01511240005493164, -0.01409149169921875, -0.01307058334350586, -0.012049674987792969, -0.011028766632080078, -0.010007858276367188, -0.008986949920654297, -0.007966041564941406, -0.006945133209228516, -0.005924224853515625, -0.004903316497802734, -0.0038824081420898438, -0.002861499786376953, -0.0018405914306640625, -0.0008196830749511719, 0.00020122528076171875, 0.0012221336364746094, 0.0022430419921875, 0.0032639503479003906, 0.004284858703613281, 0.005305767059326172, 0.0063266754150390625, 0.007347583770751953, 0.008368492126464844, 0.009389400482177734, 0.010410308837890625, 0.011431217193603516, 0.012452125549316406, 0.013473033905029297, 0.014493942260742188, 0.015514850616455078, 0.01653575897216797, 0.01755666732788086, 0.01857757568359375, 0.01959848403930664, 0.02061939239501953, 0.021640300750732422, 0.022661209106445312, 0.023682117462158203, 0.024703025817871094, 0.025723934173583984, 0.026744842529296875, 0.027765750885009766, 0.028786659240722656, 0.029807567596435547, 0.030828475952148438, 0.03184938430786133, 0.03287029266357422, 0.03389120101928711, 0.034912109375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 10.0, 36.0, 173.0, 344.0, 320.0, 99.0, 27.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002508872654289007, -0.002445819089189172, -0.00238276575691998, -0.0023197121918201447, -0.0022566586267203093, -0.002193605061620474, -0.002130551729351282, -0.0020674981642514467, -0.0020044445991516113, -0.0019413911504670978, -0.0018783375853672624, -0.0018152841366827488, -0.0017522305715829134, -0.0016891771228983998, -0.0016261236742138863, -0.0015630701091140509, -0.0015000166604295373, -0.0014369632117450237, -0.0013739096466451883, -0.0013108561979606748, -0.0012478026328608394, -0.0011847491841763258, -0.0011216956190764904, -0.0010586421703919768, -0.0009955887217074633, -0.0009325352148152888, -0.0008694817079231143, -0.0008064282592386007, -0.0007433746941387653, -0.0006803212454542518, -0.0006172677385620773, -0.0005542142316699028, -0.0004911605501547456, -0.0004281070432625711, -0.0003650535363703966, -0.0003020000585820526, -0.0002389465516898781, -0.00017589304479770362, -0.0001128395670093596, -4.9786060117185116e-05, 1.3267446774989367e-05, 7.632094639120623e-05, 0.0001393744460074231, 0.00020242793834768236, 0.00026548144523985684, 0.0003285349521320313, 0.00039158842992037535, 0.00045464193681254983, 0.0005176954437047243, 0.0005807489505968988, 0.0006438024574890733, 0.0007068559061735868, 0.0007699094712734222, 0.0008329629199579358, 0.0008960164268501103, 0.0009590699337422848, 0.0010221234988421202, 0.0010851769475266337, 0.0011482305126264691, 0.0012112839613109827, 0.001274337526410818, 0.0013373909750953317, 0.0014004444237798452, 0.0014634979888796806, 0.0015265514375641942]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 5.0, 7.0, 19.0, 13.0, 13.0, 11.0, 19.0, 24.0, 23.0, 21.0, 25.0, 27.0, 25.0, 31.0, 30.0, 31.0, 38.0, 38.0, 48.0, 49.0, 38.0, 44.0, 35.0, 28.0, 38.0, 33.0, 36.0, 27.0, 23.0, 20.0, 16.0, 26.0, 18.0, 16.0, 22.0, 12.0, 14.0, 10.0, 8.0, 5.0, 8.0, 5.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0005908608436584473, -0.0005725296214222908, -0.0005541983991861343, -0.0005358671769499779, -0.0005175359547138214, -0.000499204732477665, -0.0004808735102415085, -0.000462542288005352, -0.00044421106576919556, -0.0004258798435330391, -0.00040754862129688263, -0.00038921739906072617, -0.0003708861768245697, -0.00035255495458841324, -0.0003342237323522568, -0.0003158925101161003, -0.00029756128787994385, -0.0002792300656437874, -0.0002608988434076309, -0.00024256762117147446, -0.000224236398935318, -0.00020590517669916153, -0.00018757395446300507, -0.0001692427322268486, -0.00015091150999069214, -0.00013258028775453568, -0.00011424906551837921, -9.591784328222275e-05, -7.758662104606628e-05, -5.925539880990982e-05, -4.092417657375336e-05, -2.2592954337596893e-05, -4.26173210144043e-06, 1.4069490134716034e-05, 3.24007123708725e-05, 5.073193460702896e-05, 6.906315684318542e-05, 8.739437907934189e-05, 0.00010572560131549835, 0.00012405682355165482, 0.00014238804578781128, 0.00016071926802396774, 0.0001790504902601242, 0.00019738171249628067, 0.00021571293473243713, 0.0002340441569685936, 0.00025237537920475006, 0.0002707066014409065, 0.000289037823677063, 0.00030736904591321945, 0.0003257002681493759, 0.0003440314903855324, 0.00036236271262168884, 0.0003806939348578453, 0.00039902515709400177, 0.00041735637933015823, 0.0004356876015663147, 0.00045401882380247116, 0.0004723500460386276, 0.0004906812682747841, 0.0005090124905109406, 0.000527343712747097, 0.0005456749349832535, 0.0005640061572194099, 0.0005823373794555664]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 3.0, 5.0, 8.0, 8.0, 12.0, 16.0, 9.0, 10.0, 14.0, 16.0, 17.0, 19.0, 20.0, 21.0, 21.0, 18.0, 31.0, 43.0, 33.0, 38.0, 26.0, 30.0, 34.0, 27.0, 36.0, 36.0, 42.0, 27.0, 33.0, 23.0, 31.0, 33.0, 30.0, 22.0, 24.0, 27.0, 21.0, 16.0, 19.0, 19.0, 19.0, 13.0, 13.0, 4.0, 1.0, 5.0, 7.0, 6.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 4.0], "bins": [-8.0859375, -7.83544921875, -7.5849609375, -7.33447265625, -7.083984375, -6.83349609375, -6.5830078125, -6.33251953125, -6.08203125, -5.83154296875, -5.5810546875, -5.33056640625, -5.080078125, -4.82958984375, -4.5791015625, -4.32861328125, -4.078125, -3.82763671875, -3.5771484375, -3.32666015625, -3.076171875, -2.82568359375, -2.5751953125, -2.32470703125, -2.07421875, -1.82373046875, -1.5732421875, -1.32275390625, -1.072265625, -0.82177734375, -0.5712890625, -0.32080078125, -0.0703125, 0.18017578125, 0.4306640625, 0.68115234375, 0.931640625, 1.18212890625, 1.4326171875, 1.68310546875, 1.93359375, 2.18408203125, 2.4345703125, 2.68505859375, 2.935546875, 3.18603515625, 3.4365234375, 3.68701171875, 3.9375, 4.18798828125, 4.4384765625, 4.68896484375, 4.939453125, 5.18994140625, 5.4404296875, 5.69091796875, 5.94140625, 6.19189453125, 6.4423828125, 6.69287109375, 6.943359375, 7.19384765625, 7.4443359375, 7.69482421875, 7.9453125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 7.0, 4.0, 3.0, 4.0, 6.0, 12.0, 14.0, 13.0, 19.0, 31.0, 40.0, 45.0, 56.0, 82.0, 92.0, 108.0, 157.0, 202.0, 256.0, 372.0, 464.0, 742.0, 1153.0, 1858.0, 3819.0, 7782.0, 19465.0, 51031.0, 140905.0, 339326.0, 295187.0, 113280.0, 41074.0, 15756.0, 6673.0, 3228.0, 1775.0, 1005.0, 679.0, 450.0, 309.0, 247.0, 182.0, 149.0, 108.0, 96.0, 57.0, 56.0, 58.0, 34.0, 24.0, 21.0, 16.0, 9.0, 7.0, 9.0, 5.0, 4.0, 1.0, 0.0, 1.0, 2.0, 3.0], "bins": [-8.71875, -8.4365234375, -8.154296875, -7.8720703125, -7.58984375, -7.3076171875, -7.025390625, -6.7431640625, -6.4609375, -6.1787109375, -5.896484375, -5.6142578125, -5.33203125, -5.0498046875, -4.767578125, -4.4853515625, -4.203125, -3.9208984375, -3.638671875, -3.3564453125, -3.07421875, -2.7919921875, -2.509765625, -2.2275390625, -1.9453125, -1.6630859375, -1.380859375, -1.0986328125, -0.81640625, -0.5341796875, -0.251953125, 0.0302734375, 0.3125, 0.5947265625, 0.876953125, 1.1591796875, 1.44140625, 1.7236328125, 2.005859375, 2.2880859375, 2.5703125, 2.8525390625, 3.134765625, 3.4169921875, 3.69921875, 3.9814453125, 4.263671875, 4.5458984375, 4.828125, 5.1103515625, 5.392578125, 5.6748046875, 5.95703125, 6.2392578125, 6.521484375, 6.8037109375, 7.0859375, 7.3681640625, 7.650390625, 7.9326171875, 8.21484375, 8.4970703125, 8.779296875, 9.0615234375, 9.34375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 6.0, 5.0, 9.0, 9.0, 11.0, 18.0, 16.0, 39.0, 33.0, 43.0, 41.0, 62.0, 81.0, 79.0, 244.0, 1701.0, 230.0, 85.0, 82.0, 51.0, 40.0, 38.0, 36.0, 28.0, 11.0, 11.0, 12.0, 13.0, 3.0, 12.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.875, -41.66650390625, -40.4580078125, -39.24951171875, -38.041015625, -36.83251953125, -35.6240234375, -34.41552734375, -33.20703125, -31.99853515625, -30.7900390625, -29.58154296875, -28.373046875, -27.16455078125, -25.9560546875, -24.74755859375, -23.5390625, -22.33056640625, -21.1220703125, -19.91357421875, -18.705078125, -17.49658203125, -16.2880859375, -15.07958984375, -13.87109375, -12.66259765625, -11.4541015625, -10.24560546875, -9.037109375, -7.82861328125, -6.6201171875, -5.41162109375, -4.203125, -2.99462890625, -1.7861328125, -0.57763671875, 0.630859375, 1.83935546875, 3.0478515625, 4.25634765625, 5.46484375, 6.67333984375, 7.8818359375, 9.09033203125, 10.298828125, 11.50732421875, 12.7158203125, 13.92431640625, 15.1328125, 16.34130859375, 17.5498046875, 18.75830078125, 19.966796875, 21.17529296875, 22.3837890625, 23.59228515625, 24.80078125, 26.00927734375, 27.2177734375, 28.42626953125, 29.634765625, 30.84326171875, 32.0517578125, 33.26025390625, 34.46875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 7.0, 10.0, 10.0, 10.0, 20.0, 24.0, 27.0, 41.0, 59.0, 82.0, 120.0, 189.0, 262.0, 527.0, 1822.0, 75267.0, 3039079.0, 25539.0, 1235.0, 493.0, 288.0, 152.0, 130.0, 81.0, 61.0, 41.0, 37.0, 21.0, 14.0, 16.0, 11.0, 4.0, 6.0, 5.0, 2.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.4375, -45.82373046875, -44.2099609375, -42.59619140625, -40.982421875, -39.36865234375, -37.7548828125, -36.14111328125, -34.52734375, -32.91357421875, -31.2998046875, -29.68603515625, -28.072265625, -26.45849609375, -24.8447265625, -23.23095703125, -21.6171875, -20.00341796875, -18.3896484375, -16.77587890625, -15.162109375, -13.54833984375, -11.9345703125, -10.32080078125, -8.70703125, -7.09326171875, -5.4794921875, -3.86572265625, -2.251953125, -0.63818359375, 0.9755859375, 2.58935546875, 4.203125, 5.81689453125, 7.4306640625, 9.04443359375, 10.658203125, 12.27197265625, 13.8857421875, 15.49951171875, 17.11328125, 18.72705078125, 20.3408203125, 21.95458984375, 23.568359375, 25.18212890625, 26.7958984375, 28.40966796875, 30.0234375, 31.63720703125, 33.2509765625, 34.86474609375, 36.478515625, 38.09228515625, 39.7060546875, 41.31982421875, 42.93359375, 44.54736328125, 46.1611328125, 47.77490234375, 49.388671875, 51.00244140625, 52.6162109375, 54.22998046875, 55.84375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 31.0, 633.0, 347.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-354.1091003417969, -347.0032653808594, -339.89739990234375, -332.79156494140625, -325.6856994628906, -318.5798645019531, -311.4739990234375, -304.3681640625, -297.2623291015625, -290.156494140625, -283.0506286621094, -275.9447937011719, -268.83892822265625, -261.73309326171875, -254.6272430419922, -247.52139282226562, -240.41552734375, -233.30967712402344, -226.20382690429688, -219.0979766845703, -211.99212646484375, -204.88629150390625, -197.7804412841797, -190.67459106445312, -183.56874084472656, -176.462890625, -169.35704040527344, -162.25119018554688, -155.14535522460938, -148.03948974609375, -140.93365478515625, -133.8278045654297, -126.72193908691406, -119.6160888671875, -112.51023864746094, -105.4043960571289, -98.29854583740234, -91.19269561767578, -84.08685302734375, -76.98100280761719, -69.87515258789062, -62.76930236816406, -55.663455963134766, -48.55760955810547, -41.451759338378906, -34.345909118652344, -27.240062713623047, -20.13421630859375, -13.028366088867188, -5.922517776489258, 1.1833305358886719, 8.289178848266602, 15.395027160644531, 22.500877380371094, 29.60672378540039, 36.71257019042969, 43.81842041015625, 50.92427062988281, 58.03011703491211, 65.1359634399414, 72.24181365966797, 79.34766387939453, 86.45350646972656, 93.55935668945312, 100.66520690917969]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 1.0, 9.0, 12.0, 10.0, 10.0, 15.0, 11.0, 15.0, 15.0, 24.0, 20.0, 18.0, 20.0, 22.0, 35.0, 30.0, 30.0, 36.0, 30.0, 40.0, 34.0, 38.0, 46.0, 38.0, 44.0, 36.0, 34.0, 26.0, 29.0, 26.0, 23.0, 28.0, 32.0, 24.0, 18.0, 17.0, 10.0, 16.0, 15.0, 7.0, 8.0, 8.0, 7.0, 6.0, 5.0, 6.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.524505615234375, -51.7430534362793, -49.96159744262695, -48.180145263671875, -46.3986930847168, -44.61724090576172, -42.835784912109375, -41.0543327331543, -39.27288055419922, -37.49142837524414, -35.7099723815918, -33.92852020263672, -32.14706802368164, -30.36561393737793, -28.58415985107422, -26.80270767211914, -25.021251678466797, -23.239797592163086, -21.458345413208008, -19.676891326904297, -17.89543914794922, -16.113985061645508, -14.332530975341797, -12.551077842712402, -10.769624710083008, -8.988171577453613, -7.2067179679870605, -5.425264358520508, -3.6438112258911133, -1.8623580932617188, -0.08090400695800781, 1.7005491256713867, 3.4820022583007812, 5.263455390930176, 7.0449090003967285, 8.826362609863281, 10.607815742492676, 12.38926887512207, 14.170722961425781, 15.952176094055176, 17.73362922668457, 19.51508331298828, 21.29653549194336, 23.07798957824707, 24.85944366455078, 26.64089584350586, 28.42234992980957, 30.20380401611328, 31.98525619506836, 33.76670837402344, 35.54816436767578, 37.32961654663086, 39.11106872558594, 40.89252471923828, 42.67397689819336, 44.45542907714844, 46.23688507080078, 48.01833724975586, 49.7997932434082, 51.58124542236328, 53.36269760131836, 55.14414978027344, 56.92560577392578, 58.70705795288086, 60.48851013183594]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 2.0, 6.0, 3.0, 5.0, 11.0, 11.0, 8.0, 16.0, 10.0, 12.0, 17.0, 12.0, 22.0, 27.0, 27.0, 27.0, 31.0, 28.0, 29.0, 40.0, 39.0, 20.0, 37.0, 38.0, 40.0, 27.0, 26.0, 32.0, 35.0, 32.0, 33.0, 36.0, 28.0, 27.0, 24.0, 21.0, 26.0, 19.0, 14.0, 19.0, 14.0, 11.0, 14.0, 9.0, 11.0, 3.0, 5.0, 4.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-8.328125, -8.0726318359375, -7.817138671875, -7.5616455078125, -7.30615234375, -7.0506591796875, -6.795166015625, -6.5396728515625, -6.2841796875, -6.0286865234375, -5.773193359375, -5.5177001953125, -5.26220703125, -5.0067138671875, -4.751220703125, -4.4957275390625, -4.240234375, -3.9847412109375, -3.729248046875, -3.4737548828125, -3.21826171875, -2.9627685546875, -2.707275390625, -2.4517822265625, -2.1962890625, -1.9407958984375, -1.685302734375, -1.4298095703125, -1.17431640625, -0.9188232421875, -0.663330078125, -0.4078369140625, -0.15234375, 0.1031494140625, 0.358642578125, 0.6141357421875, 0.86962890625, 1.1251220703125, 1.380615234375, 1.6361083984375, 1.8916015625, 2.1470947265625, 2.402587890625, 2.6580810546875, 2.91357421875, 3.1690673828125, 3.424560546875, 3.6800537109375, 3.935546875, 4.1910400390625, 4.446533203125, 4.7020263671875, 4.95751953125, 5.2130126953125, 5.468505859375, 5.7239990234375, 5.9794921875, 6.2349853515625, 6.490478515625, 6.7459716796875, 7.00146484375, 7.2569580078125, 7.512451171875, 7.7679443359375, 8.0234375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 8.0, 3.0, 3.0, 6.0, 5.0, 11.0, 9.0, 18.0, 16.0, 17.0, 30.0, 36.0, 59.0, 57.0, 73.0, 120.0, 158.0, 183.0, 302.0, 372.0, 507.0, 8224.0, 4181353.0, 988.0, 420.0, 353.0, 233.0, 192.0, 125.0, 83.0, 74.0, 58.0, 50.0, 28.0, 21.0, 21.0, 13.0, 12.0, 18.0, 11.0, 2.0, 4.0, 4.0, 1.0, 2.0, 6.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-235.75, -229.064453125, -222.37890625, -215.693359375, -209.0078125, -202.322265625, -195.63671875, -188.951171875, -182.265625, -175.580078125, -168.89453125, -162.208984375, -155.5234375, -148.837890625, -142.15234375, -135.466796875, -128.78125, -122.095703125, -115.41015625, -108.724609375, -102.0390625, -95.353515625, -88.66796875, -81.982421875, -75.296875, -68.611328125, -61.92578125, -55.240234375, -48.5546875, -41.869140625, -35.18359375, -28.498046875, -21.8125, -15.126953125, -8.44140625, -1.755859375, 4.9296875, 11.615234375, 18.30078125, 24.986328125, 31.671875, 38.357421875, 45.04296875, 51.728515625, 58.4140625, 65.099609375, 71.78515625, 78.470703125, 85.15625, 91.841796875, 98.52734375, 105.212890625, 111.8984375, 118.583984375, 125.26953125, 131.955078125, 138.640625, 145.326171875, 152.01171875, 158.697265625, 165.3828125, 172.068359375, 178.75390625, 185.439453125, 192.125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 7.0, 11.0, 16.0, 36.0, 51.0, 86.0, 160.0, 347.0, 746.0, 1062.0, 705.0, 358.0, 208.0, 104.0, 65.0, 36.0, 21.0, 21.0, 14.0, 8.0, 8.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.140625, -23.350341796875, -22.56005859375, -21.769775390625, -20.9794921875, -20.189208984375, -19.39892578125, -18.608642578125, -17.818359375, -17.028076171875, -16.23779296875, -15.447509765625, -14.6572265625, -13.866943359375, -13.07666015625, -12.286376953125, -11.49609375, -10.705810546875, -9.91552734375, -9.125244140625, -8.3349609375, -7.544677734375, -6.75439453125, -5.964111328125, -5.173828125, -4.383544921875, -3.59326171875, -2.802978515625, -2.0126953125, -1.222412109375, -0.43212890625, 0.358154296875, 1.1484375, 1.938720703125, 2.72900390625, 3.519287109375, 4.3095703125, 5.099853515625, 5.89013671875, 6.680419921875, 7.470703125, 8.260986328125, 9.05126953125, 9.841552734375, 10.6318359375, 11.422119140625, 12.21240234375, 13.002685546875, 13.79296875, 14.583251953125, 15.37353515625, 16.163818359375, 16.9541015625, 17.744384765625, 18.53466796875, 19.324951171875, 20.115234375, 20.905517578125, 21.69580078125, 22.486083984375, 23.2763671875, 24.066650390625, 24.85693359375, 25.647216796875, 26.4375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 7.0, 2.0, 7.0, 9.0, 7.0, 20.0, 21.0, 12.0, 20.0, 41.0, 24.0, 33.0, 25.0, 36.0, 52.0, 78.0, 119.0, 367.0, 3011.0, 3813125.0, 375196.0, 1352.0, 247.0, 97.0, 72.0, 43.0, 38.0, 37.0, 32.0, 27.0, 22.0, 17.0, 14.0, 17.0, 12.0, 7.0, 8.0, 5.0, 4.0, 4.0, 6.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.125, -90.974609375, -87.82421875, -84.673828125, -81.5234375, -78.373046875, -75.22265625, -72.072265625, -68.921875, -65.771484375, -62.62109375, -59.470703125, -56.3203125, -53.169921875, -50.01953125, -46.869140625, -43.71875, -40.568359375, -37.41796875, -34.267578125, -31.1171875, -27.966796875, -24.81640625, -21.666015625, -18.515625, -15.365234375, -12.21484375, -9.064453125, -5.9140625, -2.763671875, 0.38671875, 3.537109375, 6.6875, 9.837890625, 12.98828125, 16.138671875, 19.2890625, 22.439453125, 25.58984375, 28.740234375, 31.890625, 35.041015625, 38.19140625, 41.341796875, 44.4921875, 47.642578125, 50.79296875, 53.943359375, 57.09375, 60.244140625, 63.39453125, 66.544921875, 69.6953125, 72.845703125, 75.99609375, 79.146484375, 82.296875, 85.447265625, 88.59765625, 91.748046875, 94.8984375, 98.048828125, 101.19921875, 104.349609375, 107.5]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 184.0, 807.0, 21.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-755.7564697265625, -741.8363647460938, -727.9163208007812, -713.9962158203125, -700.076171875, -686.1560668945312, -672.2359619140625, -658.31591796875, -644.3958129882812, -630.4757080078125, -616.5556640625, -602.6355590820312, -588.7155151367188, -574.79541015625, -560.8753662109375, -546.9552612304688, -533.0352172851562, -519.1151123046875, -505.195068359375, -491.27496337890625, -477.3548889160156, -463.434814453125, -449.5147399902344, -435.59466552734375, -421.674560546875, -407.7544860839844, -393.83441162109375, -379.914306640625, -365.9942321777344, -352.07415771484375, -338.1540832519531, -324.2340087890625, -310.3139343261719, -296.39385986328125, -282.4737854003906, -268.5537109375, -254.6336212158203, -240.71353149414062, -226.79345703125, -212.87338256835938, -198.95330810546875, -185.03323364257812, -171.11314392089844, -157.1930694580078, -143.2729949951172, -129.3529052734375, -115.43283081054688, -101.51275634765625, -87.59266662597656, -73.6725845336914, -59.75251007080078, -45.832427978515625, -31.912349700927734, -17.992271423339844, -4.0721893310546875, 9.847885131835938, 23.767967224121094, 37.688045501708984, 51.608123779296875, 65.52820587158203, 79.44828796386719, 93.36836242675781, 107.28844451904297, 121.2085189819336, 135.12860107421875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 7.0, 9.0, 11.0, 16.0, 25.0, 20.0, 28.0, 35.0, 31.0, 31.0, 31.0, 34.0, 52.0, 43.0, 45.0, 53.0, 41.0, 48.0, 29.0, 48.0, 43.0, 42.0, 42.0, 35.0, 26.0, 31.0, 35.0, 26.0, 10.0, 11.0, 16.0, 9.0, 10.0, 5.0, 3.0, 3.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.16009521484375, -47.26654815673828, -45.37300109863281, -43.479454040527344, -41.585906982421875, -39.692359924316406, -37.79881286621094, -35.90526580810547, -34.01171875, -32.11817169189453, -30.224624633789062, -28.331077575683594, -26.437530517578125, -24.543983459472656, -22.650436401367188, -20.75688934326172, -18.86334228515625, -16.96979522705078, -15.076248168945312, -13.182701110839844, -11.289154052734375, -9.395606994628906, -7.5020599365234375, -5.608512878417969, -3.7149658203125, -1.8214187622070312, 0.0721282958984375, 1.9656753540039062, 3.859222412109375, 5.752769470214844, 7.6463165283203125, 9.539863586425781, 11.43341064453125, 13.326957702636719, 15.220504760742188, 17.114051818847656, 19.007598876953125, 20.901145935058594, 22.794692993164062, 24.68824005126953, 26.581787109375, 28.47533416748047, 30.368881225585938, 32.262428283691406, 34.155975341796875, 36.049522399902344, 37.94306945800781, 39.83661651611328, 41.73016357421875, 43.62371063232422, 45.51725769042969, 47.410804748535156, 49.304351806640625, 51.197898864746094, 53.09144592285156, 54.98499298095703, 56.8785400390625, 58.77208709716797, 60.66563415527344, 62.559181213378906, 64.45272827148438, 66.34627532958984, 68.23982238769531, 70.13336944580078, 72.02691650390625]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 8.0, 6.0, 11.0, 9.0, 16.0, 14.0, 19.0, 17.0, 22.0, 26.0, 20.0, 23.0, 37.0, 29.0, 40.0, 33.0, 33.0, 28.0, 29.0, 23.0, 37.0, 38.0, 54.0, 32.0, 32.0, 33.0, 35.0, 24.0, 33.0, 30.0, 27.0, 29.0, 24.0, 23.0, 23.0, 12.0, 10.0, 17.0, 9.0, 9.0, 8.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.4219970703125, -8.148681640625, -7.8753662109375, -7.60205078125, -7.3287353515625, -7.055419921875, -6.7821044921875, -6.5087890625, -6.2354736328125, -5.962158203125, -5.6888427734375, -5.41552734375, -5.1422119140625, -4.868896484375, -4.5955810546875, -4.322265625, -4.0489501953125, -3.775634765625, -3.5023193359375, -3.22900390625, -2.9556884765625, -2.682373046875, -2.4090576171875, -2.1357421875, -1.8624267578125, -1.589111328125, -1.3157958984375, -1.04248046875, -0.7691650390625, -0.495849609375, -0.2225341796875, 0.05078125, 0.3240966796875, 0.597412109375, 0.8707275390625, 1.14404296875, 1.4173583984375, 1.690673828125, 1.9639892578125, 2.2373046875, 2.5106201171875, 2.783935546875, 3.0572509765625, 3.33056640625, 3.6038818359375, 3.877197265625, 4.1505126953125, 4.423828125, 4.6971435546875, 4.970458984375, 5.2437744140625, 5.51708984375, 5.7904052734375, 6.063720703125, 6.3370361328125, 6.6103515625, 6.8836669921875, 7.156982421875, 7.4302978515625, 7.70361328125, 7.9769287109375, 8.250244140625, 8.5235595703125, 8.796875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 7.0, 11.0, 9.0, 24.0, 35.0, 53.0, 75.0, 101.0, 189.0, 294.0, 468.0, 780.0, 1297.0, 2107.0, 3507.0, 5734.0, 9724.0, 16434.0, 27646.0, 47533.0, 84567.0, 163902.0, 336464.0, 155210.0, 80767.0, 45540.0, 26589.0, 15860.0, 9386.0, 5644.0, 3387.0, 2023.0, 1200.0, 746.0, 489.0, 283.0, 177.0, 110.0, 64.0, 42.0, 25.0, 17.0, 16.0, 6.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.177734375, -2.1085205078125, -2.039306640625, -1.9700927734375, -1.90087890625, -1.8316650390625, -1.762451171875, -1.6932373046875, -1.6240234375, -1.5548095703125, -1.485595703125, -1.4163818359375, -1.34716796875, -1.2779541015625, -1.208740234375, -1.1395263671875, -1.0703125, -1.0010986328125, -0.931884765625, -0.8626708984375, -0.79345703125, -0.7242431640625, -0.655029296875, -0.5858154296875, -0.5166015625, -0.4473876953125, -0.378173828125, -0.3089599609375, -0.23974609375, -0.1705322265625, -0.101318359375, -0.0321044921875, 0.037109375, 0.1063232421875, 0.175537109375, 0.2447509765625, 0.31396484375, 0.3831787109375, 0.452392578125, 0.5216064453125, 0.5908203125, 0.6600341796875, 0.729248046875, 0.7984619140625, 0.86767578125, 0.9368896484375, 1.006103515625, 1.0753173828125, 1.14453125, 1.2137451171875, 1.282958984375, 1.3521728515625, 1.42138671875, 1.4906005859375, 1.559814453125, 1.6290283203125, 1.6982421875, 1.7674560546875, 1.836669921875, 1.9058837890625, 1.97509765625, 2.0443115234375, 2.113525390625, 2.1827392578125, 2.251953125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 2.0, 6.0, 5.0, 1.0, 3.0, 10.0, 7.0, 10.0, 11.0, 16.0, 24.0, 25.0, 28.0, 39.0, 38.0, 29.0, 35.0, 44.0, 32.0, 43.0, 48.0, 51.0, 1059.0, 41.0, 38.0, 39.0, 39.0, 46.0, 42.0, 34.0, 27.0, 26.0, 19.0, 23.0, 15.0, 16.0, 12.0, 11.0, 12.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.921875, -5.72161865234375, -5.5213623046875, -5.32110595703125, -5.120849609375, -4.92059326171875, -4.7203369140625, -4.52008056640625, -4.31982421875, -4.11956787109375, -3.9193115234375, -3.71905517578125, -3.518798828125, -3.31854248046875, -3.1182861328125, -2.91802978515625, -2.7177734375, -2.51751708984375, -2.3172607421875, -2.11700439453125, -1.916748046875, -1.71649169921875, -1.5162353515625, -1.31597900390625, -1.11572265625, -0.91546630859375, -0.7152099609375, -0.51495361328125, -0.314697265625, -0.11444091796875, 0.0858154296875, 0.28607177734375, 0.486328125, 0.68658447265625, 0.8868408203125, 1.08709716796875, 1.287353515625, 1.48760986328125, 1.6878662109375, 1.88812255859375, 2.08837890625, 2.28863525390625, 2.4888916015625, 2.68914794921875, 2.889404296875, 3.08966064453125, 3.2899169921875, 3.49017333984375, 3.6904296875, 3.89068603515625, 4.0909423828125, 4.29119873046875, 4.491455078125, 4.69171142578125, 4.8919677734375, 5.09222412109375, 5.29248046875, 5.49273681640625, 5.6929931640625, 5.89324951171875, 6.093505859375, 6.29376220703125, 6.4940185546875, 6.69427490234375, 6.89453125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 4.0, 2.0, 11.0, 17.0, 25.0, 28.0, 59.0, 107.0, 186.0, 336.0, 632.0, 1061.0, 2067.0, 4037.0, 8237.0, 16697.0, 35776.0, 81755.0, 231268.0, 1484405.0, 129298.0, 53522.0, 24266.0, 11364.0, 5727.0, 2849.0, 1545.0, 783.0, 426.0, 285.0, 135.0, 87.0, 38.0, 24.0, 20.0, 16.0, 6.0, 4.0, 5.0, 3.0, 6.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.330078125, -3.23284912109375, -3.1356201171875, -3.03839111328125, -2.941162109375, -2.84393310546875, -2.7467041015625, -2.64947509765625, -2.55224609375, -2.45501708984375, -2.3577880859375, -2.26055908203125, -2.163330078125, -2.06610107421875, -1.9688720703125, -1.87164306640625, -1.7744140625, -1.67718505859375, -1.5799560546875, -1.48272705078125, -1.385498046875, -1.28826904296875, -1.1910400390625, -1.09381103515625, -0.99658203125, -0.89935302734375, -0.8021240234375, -0.70489501953125, -0.607666015625, -0.51043701171875, -0.4132080078125, -0.31597900390625, -0.21875, -0.12152099609375, -0.0242919921875, 0.07293701171875, 0.170166015625, 0.26739501953125, 0.3646240234375, 0.46185302734375, 0.55908203125, 0.65631103515625, 0.7535400390625, 0.85076904296875, 0.947998046875, 1.04522705078125, 1.1424560546875, 1.23968505859375, 1.3369140625, 1.43414306640625, 1.5313720703125, 1.62860107421875, 1.725830078125, 1.82305908203125, 1.9202880859375, 2.01751708984375, 2.11474609375, 2.21197509765625, 2.3092041015625, 2.40643310546875, 2.503662109375, 2.60089111328125, 2.6981201171875, 2.79534912109375, 2.892578125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 3.0, 6.0, 1.0, 2.0, 4.0, 7.0, 3.0, 5.0, 14.0, 9.0, 10.0, 6.0, 20.0, 30.0, 25.0, 30.0, 40.0, 51.0, 58.0, 86.0, 71.0, 68.0, 74.0, 60.0, 54.0, 48.0, 39.0, 36.0, 21.0, 18.0, 23.0, 17.0, 12.0, 15.0, 7.0, 6.0, 8.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0014390945434570312, -0.001394912600517273, -0.0013507306575775146, -0.0013065487146377563, -0.001262366771697998, -0.0012181848287582397, -0.0011740028858184814, -0.0011298209428787231, -0.0010856389999389648, -0.0010414570569992065, -0.0009972751140594482, -0.0009530931711196899, -0.0009089112281799316, -0.0008647292852401733, -0.000820547342300415, -0.0007763653993606567, -0.0007321834564208984, -0.0006880015134811401, -0.0006438195705413818, -0.0005996376276016235, -0.0005554556846618652, -0.0005112737417221069, -0.00046709179878234863, -0.00042290985584259033, -0.00037872791290283203, -0.00033454596996307373, -0.00029036402702331543, -0.00024618208408355713, -0.00020200014114379883, -0.00015781819820404053, -0.00011363625526428223, -6.945431232452393e-05, -2.5272369384765625e-05, 1.8909573554992676e-05, 6.309151649475098e-05, 0.00010727345943450928, 0.00015145540237426758, 0.00019563734531402588, 0.00023981928825378418, 0.0002840012311935425, 0.0003281831741333008, 0.0003723651170730591, 0.0004165470600128174, 0.0004607290029525757, 0.000504910945892334, 0.0005490928888320923, 0.0005932748317718506, 0.0006374567747116089, 0.0006816387176513672, 0.0007258206605911255, 0.0007700026035308838, 0.0008141845464706421, 0.0008583664894104004, 0.0009025484323501587, 0.000946730375289917, 0.0009909123182296753, 0.0010350942611694336, 0.001079276204109192, 0.0011234581470489502, 0.0011676400899887085, 0.0012118220329284668, 0.001256003975868225, 0.0013001859188079834, 0.0013443678617477417, 0.0013885498046875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 8.0, 4.0, 14.0, 10.0, 10.0, 19.0, 27.0, 49.0, 35.0, 57.0, 84.0, 105.0, 151.0, 229.0, 338.0, 716.0, 2348.0, 1007031.0, 34762.0, 1063.0, 475.0, 286.0, 206.0, 143.0, 88.0, 69.0, 41.0, 28.0, 29.0, 22.0, 22.0, 9.0, 12.0, 8.0, 7.0, 7.0, 1.0, 12.0, 5.0, 4.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.02593994140625, -0.025122642517089844, -0.024305343627929688, -0.02348804473876953, -0.022670745849609375, -0.02185344696044922, -0.021036148071289062, -0.020218849182128906, -0.01940155029296875, -0.018584251403808594, -0.017766952514648438, -0.01694965362548828, -0.016132354736328125, -0.015315055847167969, -0.014497756958007812, -0.013680458068847656, -0.0128631591796875, -0.012045860290527344, -0.011228561401367188, -0.010411262512207031, -0.009593963623046875, -0.008776664733886719, -0.007959365844726562, -0.007142066955566406, -0.00632476806640625, -0.005507469177246094, -0.0046901702880859375, -0.0038728713989257812, -0.003055572509765625, -0.0022382736206054688, -0.0014209747314453125, -0.0006036758422851562, 0.000213623046875, 0.0010309219360351562, 0.0018482208251953125, 0.0026655197143554688, 0.003482818603515625, 0.004300117492675781, 0.0051174163818359375, 0.005934715270996094, 0.00675201416015625, 0.007569313049316406, 0.008386611938476562, 0.009203910827636719, 0.010021209716796875, 0.010838508605957031, 0.011655807495117188, 0.012473106384277344, 0.0132904052734375, 0.014107704162597656, 0.014925003051757812, 0.01574230194091797, 0.016559600830078125, 0.01737689971923828, 0.018194198608398438, 0.019011497497558594, 0.01982879638671875, 0.020646095275878906, 0.021463394165039062, 0.02228069305419922, 0.023097991943359375, 0.02391529083251953, 0.024732589721679688, 0.025549888610839844, 0.0263671875]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 16.0, 52.0, 171.0, 314.0, 260.0, 140.0, 38.0, 11.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002372708171606064, -0.002318601356819272, -0.002264494774863124, -0.002210387960076332, -0.002156281378120184, -0.002102174563333392, -0.002048067981377244, -0.001993961166590452, -0.0019398544682189822, -0.0018857477698475122, -0.0018316410714760423, -0.0017775343731045723, -0.0017234275583177805, -0.0016693209763616323, -0.0016152141615748405, -0.0015611074632033706, -0.0015070007648319006, -0.0014528940664604306, -0.0013987873680889606, -0.0013446806697174907, -0.0012905739713460207, -0.001236467156559229, -0.001182360458187759, -0.001128253759816289, -0.001074147061444819, -0.001020040363073349, -0.000965933664701879, -0.0009118269081227481, -0.0008577202097512782, -0.0008036135113798082, -0.0007495067548006773, -0.0006954000564292073, -0.0006412932416424155, -0.0005871865432709455, -0.0005330798448994756, -0.0004789730883203447, -0.0004248663899488747, -0.00037075969157740474, -0.0003166529641021043, -0.0002625462366268039, -0.0002084395382553339, -0.0001543328253319487, -0.0001002261124085635, -4.611939948517829e-05, 7.987313438206911e-06, 6.209401180967689e-05, 0.00011620073928497732, 0.00017030746676027775, 0.00022441416513174772, 0.0002785208635032177, 0.00033262759097851813, 0.00038673431845381856, 0.00044084101682528853, 0.0004949477151967585, 0.0005490544717758894, 0.0006031611701473594, 0.0006572678685188293, 0.0007113745668902993, 0.0007654812652617693, 0.0008195880218409002, 0.0008736947202123702, 0.0009278014185838401, 0.000981908175162971, 0.001036014873534441, 0.001090121571905911]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 11.0, 7.0, 11.0, 14.0, 10.0, 8.0, 8.0, 14.0, 23.0, 21.0, 23.0, 43.0, 28.0, 39.0, 34.0, 42.0, 41.0, 42.0, 46.0, 49.0, 60.0, 39.0, 41.0, 29.0, 33.0, 47.0, 30.0, 31.0, 28.0, 27.0, 29.0, 13.0, 16.0, 15.0, 11.0, 13.0, 9.0, 5.0, 4.0, 4.0, 6.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0006471872329711914, -0.0006230361759662628, -0.0005988851189613342, -0.0005747340619564056, -0.000550583004951477, -0.0005264319479465485, -0.0005022808909416199, -0.0004781298339366913, -0.0004539787769317627, -0.0004298277199268341, -0.0004056766629219055, -0.00038152560591697693, -0.00035737454891204834, -0.00033322349190711975, -0.00030907243490219116, -0.0002849213778972626, -0.000260770320892334, -0.0002366192638874054, -0.0002124682068824768, -0.00018831714987754822, -0.00016416609287261963, -0.00014001503586769104, -0.00011586397886276245, -9.171292185783386e-05, -6.756186485290527e-05, -4.3410807847976685e-05, -1.9259750843048096e-05, 4.891306161880493e-06, 2.9042363166809082e-05, 5.319342017173767e-05, 7.734447717666626e-05, 0.00010149553418159485, 0.00012564659118652344, 0.00014979764819145203, 0.00017394870519638062, 0.0001980997622013092, 0.0002222508192062378, 0.0002464018762111664, 0.00027055293321609497, 0.00029470399022102356, 0.00031885504722595215, 0.00034300610423088074, 0.0003671571612358093, 0.0003913082182407379, 0.0004154592752456665, 0.0004396103322505951, 0.0004637613892555237, 0.00048791244626045227, 0.0005120635032653809, 0.0005362145602703094, 0.000560365617275238, 0.0005845166742801666, 0.0006086677312850952, 0.0006328187882900238, 0.0006569698452949524, 0.000681120902299881, 0.0007052719593048096, 0.0007294230163097382, 0.0007535740733146667, 0.0007777251303195953, 0.0008018761873245239, 0.0008260272443294525, 0.0008501783013343811, 0.0008743293583393097, 0.0008984804153442383]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 8.0, 6.0, 11.0, 9.0, 16.0, 14.0, 19.0, 17.0, 22.0, 26.0, 20.0, 23.0, 37.0, 29.0, 40.0, 33.0, 33.0, 28.0, 29.0, 23.0, 37.0, 38.0, 54.0, 32.0, 32.0, 33.0, 35.0, 24.0, 33.0, 30.0, 27.0, 29.0, 24.0, 23.0, 23.0, 12.0, 10.0, 17.0, 9.0, 9.0, 8.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6953125, -8.4219970703125, -8.148681640625, -7.8753662109375, -7.60205078125, -7.3287353515625, -7.055419921875, -6.7821044921875, -6.5087890625, -6.2354736328125, -5.962158203125, -5.6888427734375, -5.41552734375, -5.1422119140625, -4.868896484375, -4.5955810546875, -4.322265625, -4.0489501953125, -3.775634765625, -3.5023193359375, -3.22900390625, -2.9556884765625, -2.682373046875, -2.4090576171875, -2.1357421875, -1.8624267578125, -1.589111328125, -1.3157958984375, -1.04248046875, -0.7691650390625, -0.495849609375, -0.2225341796875, 0.05078125, 0.3240966796875, 0.597412109375, 0.8707275390625, 1.14404296875, 1.4173583984375, 1.690673828125, 1.9639892578125, 2.2373046875, 2.5106201171875, 2.783935546875, 3.0572509765625, 3.33056640625, 3.6038818359375, 3.877197265625, 4.1505126953125, 4.423828125, 4.6971435546875, 4.970458984375, 5.2437744140625, 5.51708984375, 5.7904052734375, 6.063720703125, 6.3370361328125, 6.6103515625, 6.8836669921875, 7.156982421875, 7.4302978515625, 7.70361328125, 7.9769287109375, 8.250244140625, 8.5235595703125, 8.796875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 8.0, 9.0, 10.0, 20.0, 22.0, 21.0, 48.0, 57.0, 76.0, 90.0, 135.0, 189.0, 224.0, 294.0, 352.0, 505.0, 630.0, 729.0, 897.0, 1277.0, 2165.0, 4720.0, 15270.0, 67844.0, 313263.0, 475039.0, 122775.0, 25831.0, 7041.0, 2795.0, 1466.0, 1057.0, 754.0, 639.0, 558.0, 399.0, 336.0, 263.0, 176.0, 153.0, 108.0, 84.0, 75.0, 44.0, 27.0, 23.0, 19.0, 14.0, 10.0, 10.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-13.484375, -13.0654296875, -12.646484375, -12.2275390625, -11.80859375, -11.3896484375, -10.970703125, -10.5517578125, -10.1328125, -9.7138671875, -9.294921875, -8.8759765625, -8.45703125, -8.0380859375, -7.619140625, -7.2001953125, -6.78125, -6.3623046875, -5.943359375, -5.5244140625, -5.10546875, -4.6865234375, -4.267578125, -3.8486328125, -3.4296875, -3.0107421875, -2.591796875, -2.1728515625, -1.75390625, -1.3349609375, -0.916015625, -0.4970703125, -0.078125, 0.3408203125, 0.759765625, 1.1787109375, 1.59765625, 2.0166015625, 2.435546875, 2.8544921875, 3.2734375, 3.6923828125, 4.111328125, 4.5302734375, 4.94921875, 5.3681640625, 5.787109375, 6.2060546875, 6.625, 7.0439453125, 7.462890625, 7.8818359375, 8.30078125, 8.7197265625, 9.138671875, 9.5576171875, 9.9765625, 10.3955078125, 10.814453125, 11.2333984375, 11.65234375, 12.0712890625, 12.490234375, 12.9091796875, 13.328125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 4.0, 0.0, 4.0, 7.0, 11.0, 15.0, 15.0, 8.0, 20.0, 14.0, 15.0, 42.0, 53.0, 67.0, 72.0, 101.0, 175.0, 1544.0, 341.0, 147.0, 91.0, 59.0, 50.0, 42.0, 42.0, 18.0, 25.0, 13.0, 17.0, 18.0, 3.0, 9.0, 9.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.703125, -21.666259765625, -20.62939453125, -19.592529296875, -18.5556640625, -17.518798828125, -16.48193359375, -15.445068359375, -14.408203125, -13.371337890625, -12.33447265625, -11.297607421875, -10.2607421875, -9.223876953125, -8.18701171875, -7.150146484375, -6.11328125, -5.076416015625, -4.03955078125, -3.002685546875, -1.9658203125, -0.928955078125, 0.10791015625, 1.144775390625, 2.181640625, 3.218505859375, 4.25537109375, 5.292236328125, 6.3291015625, 7.365966796875, 8.40283203125, 9.439697265625, 10.4765625, 11.513427734375, 12.55029296875, 13.587158203125, 14.6240234375, 15.660888671875, 16.69775390625, 17.734619140625, 18.771484375, 19.808349609375, 20.84521484375, 21.882080078125, 22.9189453125, 23.955810546875, 24.99267578125, 26.029541015625, 27.06640625, 28.103271484375, 29.14013671875, 30.177001953125, 31.2138671875, 32.250732421875, 33.28759765625, 34.324462890625, 35.361328125, 36.398193359375, 37.43505859375, 38.471923828125, 39.5087890625, 40.545654296875, 41.58251953125, 42.619384765625, 43.65625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 8.0, 5.0, 9.0, 9.0, 12.0, 26.0, 23.0, 31.0, 42.0, 47.0, 69.0, 128.0, 186.0, 326.0, 703.0, 2264.0, 3071718.0, 67370.0, 1328.0, 550.0, 288.0, 181.0, 96.0, 58.0, 48.0, 54.0, 31.0, 23.0, 18.0, 18.0, 9.0, 5.0, 7.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-102.8125, -100.01953125, -97.2265625, -94.43359375, -91.640625, -88.84765625, -86.0546875, -83.26171875, -80.46875, -77.67578125, -74.8828125, -72.08984375, -69.296875, -66.50390625, -63.7109375, -60.91796875, -58.125, -55.33203125, -52.5390625, -49.74609375, -46.953125, -44.16015625, -41.3671875, -38.57421875, -35.78125, -32.98828125, -30.1953125, -27.40234375, -24.609375, -21.81640625, -19.0234375, -16.23046875, -13.4375, -10.64453125, -7.8515625, -5.05859375, -2.265625, 0.52734375, 3.3203125, 6.11328125, 8.90625, 11.69921875, 14.4921875, 17.28515625, 20.078125, 22.87109375, 25.6640625, 28.45703125, 31.25, 34.04296875, 36.8359375, 39.62890625, 42.421875, 45.21484375, 48.0078125, 50.80078125, 53.59375, 56.38671875, 59.1796875, 61.97265625, 64.765625, 67.55859375, 70.3515625, 73.14453125, 75.9375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 10.0, 137.0, 670.0, 182.0, 17.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.9072494506836, -96.4040298461914, -90.90081787109375, -85.39759826660156, -79.89437866210938, -74.39115905761719, -68.887939453125, -63.384727478027344, -57.881507873535156, -52.37828826904297, -46.87507247924805, -41.371856689453125, -35.86863708496094, -30.365419387817383, -24.862201690673828, -19.358985900878906, -13.855766296386719, -8.352548599243164, -2.8493309020996094, 2.6538867950439453, 8.1571044921875, 13.660322189331055, 19.16353988647461, 24.66675567626953, 30.16997528076172, 35.673194885253906, 41.17641067504883, 46.67962646484375, 52.18284606933594, 57.686065673828125, 63.18928146362305, 68.69249725341797, 74.19572448730469, 79.69894409179688, 85.20216369628906, 90.70537567138672, 96.2085952758789, 101.7118148803711, 107.21502685546875, 112.71824645996094, 118.22146606445312, 123.72468566894531, 129.2279052734375, 134.7311248779297, 140.23434448242188, 145.737548828125, 151.2407684326172, 156.74398803710938, 162.24720764160156, 167.75042724609375, 173.25364685058594, 178.75686645507812, 184.26007080078125, 189.76329040527344, 195.26651000976562, 200.7697296142578, 206.27294921875, 211.7761688232422, 217.27938842773438, 222.78260803222656, 228.28582763671875, 233.78903198242188, 239.29225158691406, 244.79547119140625, 250.29869079589844]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 7.0, 7.0, 9.0, 12.0, 11.0, 15.0, 14.0, 16.0, 24.0, 24.0, 32.0, 25.0, 36.0, 45.0, 35.0, 34.0, 33.0, 41.0, 40.0, 40.0, 38.0, 49.0, 44.0, 43.0, 43.0, 24.0, 35.0, 40.0, 25.0, 22.0, 23.0, 18.0, 13.0, 23.0, 11.0, 6.0, 9.0, 7.0, 8.0, 6.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-67.33706665039062, -65.08644104003906, -62.8358154296875, -60.58518981933594, -58.334564208984375, -56.08393859863281, -53.83331298828125, -51.58268737792969, -49.332061767578125, -47.08143615722656, -44.830810546875, -42.58018493652344, -40.329559326171875, -38.07893371582031, -35.82830810546875, -33.57768249511719, -31.32705307006836, -29.076427459716797, -26.825801849365234, -24.575176239013672, -22.32455062866211, -20.073925018310547, -17.82329750061035, -15.572671890258789, -13.322046279907227, -11.071420669555664, -8.820795059204102, -6.570168495178223, -4.31954288482666, -2.0689172744750977, 0.18170928955078125, 2.4323348999023438, 4.682960510253906, 6.933586120605469, 9.184211730957031, 11.43483829498291, 13.685463905334473, 15.936089515686035, 18.186716079711914, 20.437341690063477, 22.68796730041504, 24.9385929107666, 27.189218521118164, 29.43984603881836, 31.690471649169922, 33.941097259521484, 36.19172286987305, 38.44234848022461, 40.69297409057617, 42.943599700927734, 45.1942253112793, 47.44485092163086, 49.69547653198242, 51.946102142333984, 54.19673156738281, 56.447357177734375, 58.69798278808594, 60.9486083984375, 63.19923400878906, 65.44985961914062, 67.70048522949219, 69.95111083984375, 72.20173645019531, 74.45236206054688, 76.70298767089844]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 9.0, 4.0, 6.0, 17.0, 10.0, 12.0, 19.0, 16.0, 12.0, 19.0, 20.0, 28.0, 28.0, 22.0, 29.0, 32.0, 33.0, 24.0, 38.0, 29.0, 40.0, 26.0, 25.0, 27.0, 43.0, 34.0, 31.0, 34.0, 26.0, 35.0, 42.0, 26.0, 23.0, 16.0, 27.0, 14.0, 11.0, 18.0, 20.0, 18.0, 6.0, 7.0, 7.0, 12.0, 4.0, 4.0, 4.0, 2.0, 2.0, 5.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-7.73828125, -7.49200439453125, -7.2457275390625, -6.99945068359375, -6.753173828125, -6.50689697265625, -6.2606201171875, -6.01434326171875, -5.76806640625, -5.52178955078125, -5.2755126953125, -5.02923583984375, -4.782958984375, -4.53668212890625, -4.2904052734375, -4.04412841796875, -3.7978515625, -3.55157470703125, -3.3052978515625, -3.05902099609375, -2.812744140625, -2.56646728515625, -2.3201904296875, -2.07391357421875, -1.82763671875, -1.58135986328125, -1.3350830078125, -1.08880615234375, -0.842529296875, -0.59625244140625, -0.3499755859375, -0.10369873046875, 0.142578125, 0.38885498046875, 0.6351318359375, 0.88140869140625, 1.127685546875, 1.37396240234375, 1.6202392578125, 1.86651611328125, 2.11279296875, 2.35906982421875, 2.6053466796875, 2.85162353515625, 3.097900390625, 3.34417724609375, 3.5904541015625, 3.83673095703125, 4.0830078125, 4.32928466796875, 4.5755615234375, 4.82183837890625, 5.068115234375, 5.31439208984375, 5.5606689453125, 5.80694580078125, 6.05322265625, 6.29949951171875, 6.5457763671875, 6.79205322265625, 7.038330078125, 7.28460693359375, 7.5308837890625, 7.77716064453125, 8.0234375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 8.0, 11.0, 7.0, 13.0, 17.0, 21.0, 22.0, 36.0, 32.0, 60.0, 59.0, 87.0, 105.0, 173.0, 225.0, 432.0, 829.0, 2899.0, 18115.0, 446927.0, 3179999.0, 518746.0, 20174.0, 3120.0, 876.0, 382.0, 204.0, 160.0, 98.0, 105.0, 62.0, 65.0, 37.0, 43.0, 30.0, 17.0, 18.0, 18.0, 8.0, 8.0, 9.0, 6.0, 5.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-28.5625, -27.735107421875, -26.90771484375, -26.080322265625, -25.2529296875, -24.425537109375, -23.59814453125, -22.770751953125, -21.943359375, -21.115966796875, -20.28857421875, -19.461181640625, -18.6337890625, -17.806396484375, -16.97900390625, -16.151611328125, -15.32421875, -14.496826171875, -13.66943359375, -12.842041015625, -12.0146484375, -11.187255859375, -10.35986328125, -9.532470703125, -8.705078125, -7.877685546875, -7.05029296875, -6.222900390625, -5.3955078125, -4.568115234375, -3.74072265625, -2.913330078125, -2.0859375, -1.258544921875, -0.43115234375, 0.396240234375, 1.2236328125, 2.051025390625, 2.87841796875, 3.705810546875, 4.533203125, 5.360595703125, 6.18798828125, 7.015380859375, 7.8427734375, 8.670166015625, 9.49755859375, 10.324951171875, 11.15234375, 11.979736328125, 12.80712890625, 13.634521484375, 14.4619140625, 15.289306640625, 16.11669921875, 16.944091796875, 17.771484375, 18.598876953125, 19.42626953125, 20.253662109375, 21.0810546875, 21.908447265625, 22.73583984375, 23.563232421875, 24.390625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 5.0, 11.0, 11.0, 18.0, 22.0, 24.0, 44.0, 61.0, 94.0, 112.0, 186.0, 240.0, 370.0, 521.0, 599.0, 513.0, 367.0, 249.0, 172.0, 130.0, 86.0, 68.0, 45.0, 34.0, 19.0, 25.0, 9.0, 10.0, 4.0, 4.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.3203125, -14.7615966796875, -14.202880859375, -13.6441650390625, -13.08544921875, -12.5267333984375, -11.968017578125, -11.4093017578125, -10.8505859375, -10.2918701171875, -9.733154296875, -9.1744384765625, -8.61572265625, -8.0570068359375, -7.498291015625, -6.9395751953125, -6.380859375, -5.8221435546875, -5.263427734375, -4.7047119140625, -4.14599609375, -3.5872802734375, -3.028564453125, -2.4698486328125, -1.9111328125, -1.3524169921875, -0.793701171875, -0.2349853515625, 0.32373046875, 0.8824462890625, 1.441162109375, 1.9998779296875, 2.55859375, 3.1173095703125, 3.676025390625, 4.2347412109375, 4.79345703125, 5.3521728515625, 5.910888671875, 6.4696044921875, 7.0283203125, 7.5870361328125, 8.145751953125, 8.7044677734375, 9.26318359375, 9.8218994140625, 10.380615234375, 10.9393310546875, 11.498046875, 12.0567626953125, 12.615478515625, 13.1741943359375, 13.73291015625, 14.2916259765625, 14.850341796875, 15.4090576171875, 15.9677734375, 16.5264892578125, 17.085205078125, 17.6439208984375, 18.20263671875, 18.7613525390625, 19.320068359375, 19.8787841796875, 20.4375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 12.0, 18.0, 51.0, 86.0, 186.0, 546.0, 3335.0, 3257835.0, 929024.0, 2398.0, 467.0, 171.0, 65.0, 45.0, 20.0, 7.0, 3.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.375, -110.38671875, -107.3984375, -104.41015625, -101.421875, -98.43359375, -95.4453125, -92.45703125, -89.46875, -86.48046875, -83.4921875, -80.50390625, -77.515625, -74.52734375, -71.5390625, -68.55078125, -65.5625, -62.57421875, -59.5859375, -56.59765625, -53.609375, -50.62109375, -47.6328125, -44.64453125, -41.65625, -38.66796875, -35.6796875, -32.69140625, -29.703125, -26.71484375, -23.7265625, -20.73828125, -17.75, -14.76171875, -11.7734375, -8.78515625, -5.796875, -2.80859375, 0.1796875, 3.16796875, 6.15625, 9.14453125, 12.1328125, 15.12109375, 18.109375, 21.09765625, 24.0859375, 27.07421875, 30.0625, 33.05078125, 36.0390625, 39.02734375, 42.015625, 45.00390625, 47.9921875, 50.98046875, 53.96875, 56.95703125, 59.9453125, 62.93359375, 65.921875, 68.91015625, 71.8984375, 74.88671875, 77.875]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 33.0, 359.0, 550.0, 66.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-272.96270751953125, -262.5291748046875, -252.09564208984375, -241.66209411621094, -231.2285614013672, -220.79502868652344, -210.36148071289062, -199.92794799804688, -189.49441528320312, -179.06088256835938, -168.62734985351562, -158.1938018798828, -147.76026916503906, -137.3267364501953, -126.89319610595703, -116.45965576171875, -106.026123046875, -95.59259033203125, -85.15904998779297, -74.72550964355469, -64.29197692871094, -53.85844039916992, -43.424903869628906, -32.991363525390625, -22.557830810546875, -12.12429428100586, -1.6907577514648438, 8.742778778076172, 19.176315307617188, 29.609851837158203, 40.04338836669922, 50.4769287109375, 60.910491943359375, 71.34402465820312, 81.7775650024414, 92.21110534667969, 102.64463806152344, 113.07817077636719, 123.51171112060547, 133.94525146484375, 144.3787841796875, 154.81231689453125, 165.245849609375, 175.6793975830078, 186.11293029785156, 196.5464630126953, 206.98001098632812, 217.41354370117188, 227.84707641601562, 238.28060913085938, 248.71414184570312, 259.1476745605469, 269.58123779296875, 280.0147705078125, 290.44830322265625, 300.8818359375, 311.31536865234375, 321.7489013671875, 332.18243408203125, 342.615966796875, 353.04949951171875, 363.4830627441406, 373.9165954589844, 384.3501281738281, 394.7836608886719]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 3.0, 4.0, 4.0, 12.0, 8.0, 10.0, 13.0, 11.0, 15.0, 14.0, 21.0, 33.0, 14.0, 30.0, 28.0, 39.0, 29.0, 54.0, 26.0, 45.0, 41.0, 41.0, 36.0, 44.0, 45.0, 47.0, 34.0, 35.0, 34.0, 40.0, 22.0, 21.0, 19.0, 18.0, 22.0, 22.0, 13.0, 9.0, 10.0, 5.0, 5.0, 8.0, 6.0, 2.0, 6.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-63.64501953125, -61.79553985595703, -59.94606018066406, -58.096580505371094, -56.247100830078125, -54.397621154785156, -52.54814147949219, -50.69866180419922, -48.84918212890625, -46.99970245361328, -45.15022277832031, -43.300743103027344, -41.451263427734375, -39.601783752441406, -37.75230407714844, -35.90282440185547, -34.0533447265625, -32.20386505126953, -30.354385375976562, -28.504905700683594, -26.655426025390625, -24.805946350097656, -22.956466674804688, -21.10698699951172, -19.25750732421875, -17.40802764892578, -15.558547973632812, -13.709068298339844, -11.859588623046875, -10.010108947753906, -8.160629272460938, -6.311149597167969, -4.461669921875, -2.6121902465820312, -0.7627105712890625, 1.0867691040039062, 2.936248779296875, 4.785728454589844, 6.6352081298828125, 8.484687805175781, 10.33416748046875, 12.183647155761719, 14.033126831054688, 15.882606506347656, 17.732086181640625, 19.581565856933594, 21.431045532226562, 23.28052520751953, 25.1300048828125, 26.97948455810547, 28.828964233398438, 30.678443908691406, 32.527923583984375, 34.377403259277344, 36.22688293457031, 38.07636260986328, 39.92584228515625, 41.77532196044922, 43.62480163574219, 45.474281311035156, 47.323760986328125, 49.173240661621094, 51.02272033691406, 52.87220001220703, 54.7216796875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 10.0, 9.0, 5.0, 12.0, 14.0, 14.0, 19.0, 18.0, 21.0, 27.0, 31.0, 32.0, 29.0, 36.0, 31.0, 32.0, 30.0, 39.0, 45.0, 54.0, 45.0, 34.0, 33.0, 35.0, 31.0, 30.0, 36.0, 32.0, 24.0, 22.0, 21.0, 24.0, 24.0, 18.0, 12.0, 12.0, 12.0, 11.0, 9.0, 4.0, 5.0, 0.0, 5.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-7.69140625, -7.4698486328125, -7.248291015625, -7.0267333984375, -6.80517578125, -6.5836181640625, -6.362060546875, -6.1405029296875, -5.9189453125, -5.6973876953125, -5.475830078125, -5.2542724609375, -5.03271484375, -4.8111572265625, -4.589599609375, -4.3680419921875, -4.146484375, -3.9249267578125, -3.703369140625, -3.4818115234375, -3.26025390625, -3.0386962890625, -2.817138671875, -2.5955810546875, -2.3740234375, -2.1524658203125, -1.930908203125, -1.7093505859375, -1.48779296875, -1.2662353515625, -1.044677734375, -0.8231201171875, -0.6015625, -0.3800048828125, -0.158447265625, 0.0631103515625, 0.28466796875, 0.5062255859375, 0.727783203125, 0.9493408203125, 1.1708984375, 1.3924560546875, 1.614013671875, 1.8355712890625, 2.05712890625, 2.2786865234375, 2.500244140625, 2.7218017578125, 2.943359375, 3.1649169921875, 3.386474609375, 3.6080322265625, 3.82958984375, 4.0511474609375, 4.272705078125, 4.4942626953125, 4.7158203125, 4.9373779296875, 5.158935546875, 5.3804931640625, 5.60205078125, 5.8236083984375, 6.045166015625, 6.2667236328125, 6.48828125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 14.0, 15.0, 21.0, 32.0, 52.0, 65.0, 99.0, 146.0, 263.0, 379.0, 596.0, 896.0, 1294.0, 2061.0, 3301.0, 5010.0, 7832.0, 12280.0, 19368.0, 31872.0, 52196.0, 91297.0, 192785.0, 319773.0, 128193.0, 69182.0, 41016.0, 25098.0, 15557.0, 10024.0, 6308.0, 4028.0, 2624.0, 1695.0, 1105.0, 736.0, 438.0, 305.0, 197.0, 143.0, 90.0, 61.0, 40.0, 19.0, 16.0, 11.0, 8.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0], "bins": [-1.671875, -1.623077392578125, -1.57427978515625, -1.525482177734375, -1.4766845703125, -1.427886962890625, -1.37908935546875, -1.330291748046875, -1.281494140625, -1.232696533203125, -1.18389892578125, -1.135101318359375, -1.0863037109375, -1.037506103515625, -0.98870849609375, -0.939910888671875, -0.89111328125, -0.842315673828125, -0.79351806640625, -0.744720458984375, -0.6959228515625, -0.647125244140625, -0.59832763671875, -0.549530029296875, -0.500732421875, -0.451934814453125, -0.40313720703125, -0.354339599609375, -0.3055419921875, -0.256744384765625, -0.20794677734375, -0.159149169921875, -0.1103515625, -0.061553955078125, -0.01275634765625, 0.036041259765625, 0.0848388671875, 0.133636474609375, 0.18243408203125, 0.231231689453125, 0.280029296875, 0.328826904296875, 0.37762451171875, 0.426422119140625, 0.4752197265625, 0.524017333984375, 0.57281494140625, 0.621612548828125, 0.67041015625, 0.719207763671875, 0.76800537109375, 0.816802978515625, 0.8656005859375, 0.914398193359375, 0.96319580078125, 1.011993408203125, 1.060791015625, 1.109588623046875, 1.15838623046875, 1.207183837890625, 1.2559814453125, 1.304779052734375, 1.35357666015625, 1.402374267578125, 1.451171875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 5.0, 5.0, 5.0, 3.0, 7.0, 5.0, 4.0, 6.0, 9.0, 14.0, 15.0, 14.0, 23.0, 17.0, 34.0, 21.0, 36.0, 35.0, 38.0, 46.0, 41.0, 37.0, 43.0, 50.0, 1059.0, 33.0, 31.0, 38.0, 35.0, 23.0, 35.0, 28.0, 27.0, 25.0, 34.0, 21.0, 24.0, 19.0, 13.0, 20.0, 9.0, 14.0, 5.0, 10.0, 6.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.5078125, -4.361328125, -4.21484375, -4.068359375, -3.921875, -3.775390625, -3.62890625, -3.482421875, -3.3359375, -3.189453125, -3.04296875, -2.896484375, -2.75, -2.603515625, -2.45703125, -2.310546875, -2.1640625, -2.017578125, -1.87109375, -1.724609375, -1.578125, -1.431640625, -1.28515625, -1.138671875, -0.9921875, -0.845703125, -0.69921875, -0.552734375, -0.40625, -0.259765625, -0.11328125, 0.033203125, 0.1796875, 0.326171875, 0.47265625, 0.619140625, 0.765625, 0.912109375, 1.05859375, 1.205078125, 1.3515625, 1.498046875, 1.64453125, 1.791015625, 1.9375, 2.083984375, 2.23046875, 2.376953125, 2.5234375, 2.669921875, 2.81640625, 2.962890625, 3.109375, 3.255859375, 3.40234375, 3.548828125, 3.6953125, 3.841796875, 3.98828125, 4.134765625, 4.28125, 4.427734375, 4.57421875, 4.720703125, 4.8671875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 7.0, 13.0, 11.0, 21.0, 32.0, 51.0, 80.0, 145.0, 261.0, 443.0, 756.0, 1284.0, 2292.0, 4375.0, 8376.0, 15896.0, 32209.0, 67945.0, 160534.0, 1488190.0, 172804.0, 71685.0, 33811.0, 17024.0, 8629.0, 4580.0, 2472.0, 1388.0, 723.0, 445.0, 246.0, 159.0, 85.0, 52.0, 29.0, 23.0, 8.0, 7.0, 5.0, 8.0, 3.0, 6.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-2.408203125, -2.336395263671875, -2.26458740234375, -2.192779541015625, -2.1209716796875, -2.049163818359375, -1.97735595703125, -1.905548095703125, -1.833740234375, -1.761932373046875, -1.69012451171875, -1.618316650390625, -1.5465087890625, -1.474700927734375, -1.40289306640625, -1.331085205078125, -1.25927734375, -1.187469482421875, -1.11566162109375, -1.043853759765625, -0.9720458984375, -0.900238037109375, -0.82843017578125, -0.756622314453125, -0.684814453125, -0.613006591796875, -0.54119873046875, -0.469390869140625, -0.3975830078125, -0.325775146484375, -0.25396728515625, -0.182159423828125, -0.1103515625, -0.038543701171875, 0.03326416015625, 0.105072021484375, 0.1768798828125, 0.248687744140625, 0.32049560546875, 0.392303466796875, 0.464111328125, 0.535919189453125, 0.60772705078125, 0.679534912109375, 0.7513427734375, 0.823150634765625, 0.89495849609375, 0.966766357421875, 1.03857421875, 1.110382080078125, 1.18218994140625, 1.253997802734375, 1.3258056640625, 1.397613525390625, 1.46942138671875, 1.541229248046875, 1.613037109375, 1.684844970703125, 1.75665283203125, 1.828460693359375, 1.9002685546875, 1.972076416015625, 2.04388427734375, 2.115692138671875, 2.1875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 0.0, 6.0, 5.0, 5.0, 6.0, 10.0, 12.0, 12.0, 18.0, 28.0, 32.0, 42.0, 48.0, 74.0, 78.0, 102.0, 79.0, 94.0, 69.0, 61.0, 41.0, 37.0, 30.0, 29.0, 16.0, 16.0, 5.0, 11.0, 10.0, 6.0, 8.0, 4.0, 1.0, 0.0, 4.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0012731552124023438, -0.0012359768152236938, -0.001198798418045044, -0.001161620020866394, -0.0011244416236877441, -0.0010872632265090942, -0.0010500848293304443, -0.0010129064321517944, -0.0009757280349731445, -0.0009385496377944946, -0.0009013712406158447, -0.0008641928434371948, -0.0008270144462585449, -0.000789836049079895, -0.0007526576519012451, -0.0007154792547225952, -0.0006783008575439453, -0.0006411224603652954, -0.0006039440631866455, -0.0005667656660079956, -0.0005295872688293457, -0.0004924088716506958, -0.0004552304744720459, -0.000418052077293396, -0.0003808736801147461, -0.0003436952829360962, -0.0003065168857574463, -0.0002693384885787964, -0.00023216009140014648, -0.00019498169422149658, -0.00015780329704284668, -0.00012062489986419678, -8.344650268554688e-05, -4.626810550689697e-05, -9.08970832824707e-06, 2.8088688850402832e-05, 6.526708602905273e-05, 0.00010244548320770264, 0.00013962388038635254, 0.00017680227756500244, 0.00021398067474365234, 0.00025115907192230225, 0.00028833746910095215, 0.00032551586627960205, 0.00036269426345825195, 0.00039987266063690186, 0.00043705105781555176, 0.00047422945499420166, 0.0005114078521728516, 0.0005485862493515015, 0.0005857646465301514, 0.0006229430437088013, 0.0006601214408874512, 0.0006972998380661011, 0.000734478235244751, 0.0007716566324234009, 0.0008088350296020508, 0.0008460134267807007, 0.0008831918239593506, 0.0009203702211380005, 0.0009575486183166504, 0.0009947270154953003, 0.0010319054126739502, 0.0010690838098526, 0.00110626220703125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 5.0, 8.0, 5.0, 6.0, 5.0, 14.0, 11.0, 13.0, 19.0, 25.0, 39.0, 45.0, 55.0, 78.0, 111.0, 155.0, 232.0, 358.0, 678.0, 2808.0, 1010934.0, 30694.0, 911.0, 452.0, 258.0, 170.0, 139.0, 92.0, 60.0, 34.0, 34.0, 18.0, 20.0, 16.0, 11.0, 11.0, 5.0, 7.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.018524169921875, -0.017900466918945312, -0.017276763916015625, -0.016653060913085938, -0.01602935791015625, -0.015405654907226562, -0.014781951904296875, -0.014158248901367188, -0.0135345458984375, -0.012910842895507812, -0.012287139892578125, -0.011663436889648438, -0.01103973388671875, -0.010416030883789062, -0.009792327880859375, -0.009168624877929688, -0.008544921875, -0.007921218872070312, -0.007297515869140625, -0.0066738128662109375, -0.00605010986328125, -0.0054264068603515625, -0.004802703857421875, -0.0041790008544921875, -0.0035552978515625, -0.0029315948486328125, -0.002307891845703125, -0.0016841888427734375, -0.00106048583984375, -0.0004367828369140625, 0.000186920166015625, 0.0008106231689453125, 0.001434326171875, 0.0020580291748046875, 0.002681732177734375, 0.0033054351806640625, 0.00392913818359375, 0.0045528411865234375, 0.005176544189453125, 0.0058002471923828125, 0.0064239501953125, 0.0070476531982421875, 0.007671356201171875, 0.008295059204101562, 0.00891876220703125, 0.009542465209960938, 0.010166168212890625, 0.010789871215820312, 0.01141357421875, 0.012037277221679688, 0.012660980224609375, 0.013284683227539062, 0.01390838623046875, 0.014532089233398438, 0.015155792236328125, 0.015779495239257812, 0.0164031982421875, 0.017026901245117188, 0.017650604248046875, 0.018274307250976562, 0.01889801025390625, 0.019521713256835938, 0.020145416259765625, 0.020769119262695312, 0.021392822265625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 10.0, 29.0, 63.0, 166.0, 268.0, 244.0, 146.0, 59.0, 25.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001402867492288351, -0.0013659041142091155, -0.00132894073612988, -0.0012919773580506444, -0.0012550139799714088, -0.0012180506018921733, -0.0011810872238129377, -0.0011441238457337022, -0.0011071604676544666, -0.001070197089575231, -0.0010332337114959955, -0.00099627033341676, -0.0009593069553375244, -0.0009223435772582889, -0.0008853801991790533, -0.0008484168210998178, -0.0008114534430205822, -0.0007744900649413466, -0.0007375266868621111, -0.0007005633087828755, -0.00066359993070364, -0.0006266365526244044, -0.0005896731745451689, -0.0005527097964659333, -0.0005157464183866978, -0.0004787830403074622, -0.00044181966222822666, -0.0004048562841489911, -0.00036789290606975555, -0.00033092952799052, -0.00029396614991128445, -0.0002570027718320489, -0.00022003945196047425, -0.0001830760738812387, -0.00014611269580200315, -0.00010914931772276759, -7.218593964353204e-05, -3.5222561564296484e-05, 1.7408165149390697e-06, 3.8704194594174623e-05, 7.566757267341018e-05, 0.00011263095075264573, 0.00014959432883188128, 0.00018655770691111684, 0.0002235210849903524, 0.00026048446306958795, 0.0002974478411488235, 0.00033441121922805905, 0.0003713745973072946, 0.00040833797538653016, 0.0004453013534657657, 0.00048226473154500127, 0.0005192281096242368, 0.0005561914877034724, 0.0005931548657827079, 0.0006301182438619435, 0.000667081621941179, 0.0007040450000204146, 0.0007410083780996501, 0.0007779717561788857, 0.0008149351342581213, 0.0008518985123373568, 0.0008888618904165924, 0.0009258252684958279, 0.0009627886465750635]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 7.0, 8.0, 8.0, 11.0, 13.0, 15.0, 11.0, 23.0, 20.0, 18.0, 21.0, 20.0, 25.0, 33.0, 37.0, 35.0, 26.0, 41.0, 44.0, 48.0, 26.0, 31.0, 49.0, 37.0, 38.0, 45.0, 30.0, 43.0, 27.0, 32.0, 25.0, 20.0, 24.0, 24.0, 16.0, 13.0, 7.0, 11.0, 5.0, 8.0, 10.0, 5.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00043141841888427734, -0.00041608046740293503, -0.0004007425159215927, -0.0003854045644402504, -0.0003700666129589081, -0.00035472866147756577, -0.00033939070999622345, -0.00032405275851488113, -0.0003087148070335388, -0.0002933768555521965, -0.0002780389040708542, -0.00026270095258951187, -0.00024736300110816956, -0.00023202504962682724, -0.00021668709814548492, -0.0002013491466641426, -0.0001860111951828003, -0.00017067324370145798, -0.00015533529222011566, -0.00013999734073877335, -0.00012465938925743103, -0.00010932143777608871, -9.39834862947464e-05, -7.864553481340408e-05, -6.330758333206177e-05, -4.796963185071945e-05, -3.2631680369377136e-05, -1.729372888803482e-05, -1.955777406692505e-06, 1.338217407464981e-05, 2.8720125555992126e-05, 4.405807703733444e-05, 5.939602851867676e-05, 7.473398000001907e-05, 9.007193148136139e-05, 0.0001054098829627037, 0.00012074783444404602, 0.00013608578592538834, 0.00015142373740673065, 0.00016676168888807297, 0.00018209964036941528, 0.0001974375918507576, 0.00021277554333209991, 0.00022811349481344223, 0.00024345144629478455, 0.00025878939777612686, 0.0002741273492574692, 0.0002894653007388115, 0.0003048032522201538, 0.0003201412037014961, 0.00033547915518283844, 0.00035081710666418076, 0.00036615505814552307, 0.0003814930096268654, 0.0003968309611082077, 0.00041216891258955, 0.00042750686407089233, 0.00044284481555223465, 0.00045818276703357697, 0.0004735207185149193, 0.0004888586699962616, 0.0005041966214776039, 0.0005195345729589462, 0.0005348725244402885, 0.0005502104759216309]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 5.0, 10.0, 9.0, 6.0, 11.0, 14.0, 14.0, 19.0, 18.0, 22.0, 28.0, 30.0, 31.0, 29.0, 36.0, 32.0, 31.0, 30.0, 39.0, 46.0, 54.0, 44.0, 34.0, 33.0, 35.0, 31.0, 31.0, 35.0, 33.0, 23.0, 23.0, 20.0, 24.0, 24.0, 18.0, 12.0, 12.0, 12.0, 11.0, 9.0, 4.0, 5.0, 0.0, 5.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-7.6875, -7.46600341796875, -7.2445068359375, -7.02301025390625, -6.801513671875, -6.58001708984375, -6.3585205078125, -6.13702392578125, -5.91552734375, -5.69403076171875, -5.4725341796875, -5.25103759765625, -5.029541015625, -4.80804443359375, -4.5865478515625, -4.36505126953125, -4.1435546875, -3.92205810546875, -3.7005615234375, -3.47906494140625, -3.257568359375, -3.03607177734375, -2.8145751953125, -2.59307861328125, -2.37158203125, -2.15008544921875, -1.9285888671875, -1.70709228515625, -1.485595703125, -1.26409912109375, -1.0426025390625, -0.82110595703125, -0.599609375, -0.37811279296875, -0.1566162109375, 0.06488037109375, 0.286376953125, 0.50787353515625, 0.7293701171875, 0.95086669921875, 1.17236328125, 1.39385986328125, 1.6153564453125, 1.83685302734375, 2.058349609375, 2.27984619140625, 2.5013427734375, 2.72283935546875, 2.9443359375, 3.16583251953125, 3.3873291015625, 3.60882568359375, 3.830322265625, 4.05181884765625, 4.2733154296875, 4.49481201171875, 4.71630859375, 4.93780517578125, 5.1593017578125, 5.38079833984375, 5.602294921875, 5.82379150390625, 6.0452880859375, 6.26678466796875, 6.48828125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 5.0, 1.0, 5.0, 2.0, 5.0, 5.0, 11.0, 19.0, 17.0, 29.0, 55.0, 70.0, 70.0, 118.0, 145.0, 201.0, 290.0, 446.0, 609.0, 874.0, 1227.0, 1794.0, 3114.0, 6854.0, 31378.0, 294263.0, 615287.0, 69637.0, 11068.0, 3978.0, 2158.0, 1471.0, 986.0, 677.0, 466.0, 337.0, 250.0, 192.0, 136.0, 78.0, 61.0, 41.0, 37.0, 27.0, 19.0, 10.0, 16.0, 7.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.5625, -15.9951171875, -15.427734375, -14.8603515625, -14.29296875, -13.7255859375, -13.158203125, -12.5908203125, -12.0234375, -11.4560546875, -10.888671875, -10.3212890625, -9.75390625, -9.1865234375, -8.619140625, -8.0517578125, -7.484375, -6.9169921875, -6.349609375, -5.7822265625, -5.21484375, -4.6474609375, -4.080078125, -3.5126953125, -2.9453125, -2.3779296875, -1.810546875, -1.2431640625, -0.67578125, -0.1083984375, 0.458984375, 1.0263671875, 1.59375, 2.1611328125, 2.728515625, 3.2958984375, 3.86328125, 4.4306640625, 4.998046875, 5.5654296875, 6.1328125, 6.7001953125, 7.267578125, 7.8349609375, 8.40234375, 8.9697265625, 9.537109375, 10.1044921875, 10.671875, 11.2392578125, 11.806640625, 12.3740234375, 12.94140625, 13.5087890625, 14.076171875, 14.6435546875, 15.2109375, 15.7783203125, 16.345703125, 16.9130859375, 17.48046875, 18.0478515625, 18.615234375, 19.1826171875, 19.75]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 5.0, 5.0, 11.0, 7.0, 11.0, 13.0, 25.0, 22.0, 23.0, 33.0, 30.0, 35.0, 44.0, 50.0, 44.0, 58.0, 114.0, 1531.0, 530.0, 94.0, 56.0, 57.0, 47.0, 35.0, 30.0, 27.0, 21.0, 22.0, 16.0, 16.0, 10.0, 13.0, 6.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.09375, -19.423828125, -18.75390625, -18.083984375, -17.4140625, -16.744140625, -16.07421875, -15.404296875, -14.734375, -14.064453125, -13.39453125, -12.724609375, -12.0546875, -11.384765625, -10.71484375, -10.044921875, -9.375, -8.705078125, -8.03515625, -7.365234375, -6.6953125, -6.025390625, -5.35546875, -4.685546875, -4.015625, -3.345703125, -2.67578125, -2.005859375, -1.3359375, -0.666015625, 0.00390625, 0.673828125, 1.34375, 2.013671875, 2.68359375, 3.353515625, 4.0234375, 4.693359375, 5.36328125, 6.033203125, 6.703125, 7.373046875, 8.04296875, 8.712890625, 9.3828125, 10.052734375, 10.72265625, 11.392578125, 12.0625, 12.732421875, 13.40234375, 14.072265625, 14.7421875, 15.412109375, 16.08203125, 16.751953125, 17.421875, 18.091796875, 18.76171875, 19.431640625, 20.1015625, 20.771484375, 21.44140625, 22.111328125, 22.78125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 8.0, 5.0, 10.0, 8.0, 10.0, 17.0, 14.0, 28.0, 41.0, 41.0, 52.0, 82.0, 107.0, 157.0, 282.0, 492.0, 1431.0, 82871.0, 3055627.0, 2450.0, 794.0, 352.0, 208.0, 156.0, 101.0, 84.0, 57.0, 59.0, 45.0, 31.0, 23.0, 23.0, 11.0, 13.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-58.90625, -57.076171875, -55.24609375, -53.416015625, -51.5859375, -49.755859375, -47.92578125, -46.095703125, -44.265625, -42.435546875, -40.60546875, -38.775390625, -36.9453125, -35.115234375, -33.28515625, -31.455078125, -29.625, -27.794921875, -25.96484375, -24.134765625, -22.3046875, -20.474609375, -18.64453125, -16.814453125, -14.984375, -13.154296875, -11.32421875, -9.494140625, -7.6640625, -5.833984375, -4.00390625, -2.173828125, -0.34375, 1.486328125, 3.31640625, 5.146484375, 6.9765625, 8.806640625, 10.63671875, 12.466796875, 14.296875, 16.126953125, 17.95703125, 19.787109375, 21.6171875, 23.447265625, 25.27734375, 27.107421875, 28.9375, 30.767578125, 32.59765625, 34.427734375, 36.2578125, 38.087890625, 39.91796875, 41.748046875, 43.578125, 45.408203125, 47.23828125, 49.068359375, 50.8984375, 52.728515625, 54.55859375, 56.388671875, 58.21875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 5.0, 14.0, 21.0, 45.0, 88.0, 162.0, 202.0, 192.0, 135.0, 72.0, 42.0, 14.0, 11.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.808773040771484, -58.38242721557617, -56.95608139038086, -55.52973556518555, -54.103389739990234, -52.67704391479492, -51.250701904296875, -49.82435607910156, -48.39801025390625, -46.97166442871094, -45.545318603515625, -44.11897277832031, -42.692626953125, -41.26628112792969, -39.839935302734375, -38.41358947753906, -36.98724365234375, -35.56089782714844, -34.134552001953125, -32.70820617675781, -31.2818603515625, -29.855514526367188, -28.429170608520508, -27.002824783325195, -25.576478958129883, -24.15013313293457, -22.723787307739258, -21.297443389892578, -19.871097564697266, -18.444751739501953, -17.01840591430664, -15.592060089111328, -14.16571044921875, -12.739364624023438, -11.313018798828125, -9.886673927307129, -8.460328102111816, -7.033982276916504, -5.607637405395508, -4.181291580200195, -2.754945755004883, -1.3286001682281494, 0.09774541854858398, 1.5240907669067383, 2.950436592102051, 4.376782417297363, 5.803127288818359, 7.229473114013672, 8.655818939208984, 10.082164764404297, 11.50851058959961, 12.934855461120605, 14.361201286315918, 15.78754711151123, 17.213891983032227, 18.64023780822754, 20.06658363342285, 21.492929458618164, 22.919275283813477, 24.345619201660156, 25.77196502685547, 27.19831085205078, 28.624656677246094, 30.051002502441406, 31.47734832763672]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 7.0, 3.0, 5.0, 6.0, 9.0, 13.0, 14.0, 15.0, 24.0, 19.0, 26.0, 32.0, 32.0, 43.0, 41.0, 58.0, 48.0, 57.0, 52.0, 47.0, 42.0, 47.0, 46.0, 32.0, 44.0, 35.0, 43.0, 24.0, 29.0, 27.0, 14.0, 16.0, 17.0, 11.0, 6.0, 8.0, 6.0, 1.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.162418365478516, -47.35891342163086, -45.55541229248047, -43.75190734863281, -41.948402404785156, -40.1448974609375, -38.34139633178711, -36.53789138793945, -34.73439025878906, -32.930885314941406, -31.127382278442383, -29.32387924194336, -27.520374298095703, -25.71687126159668, -23.913368225097656, -22.10986328125, -20.306358337402344, -18.50285530090332, -16.699350357055664, -14.89584732055664, -13.0923433303833, -11.288839340209961, -9.485336303710938, -7.681832313537598, -5.878328323364258, -4.074824333190918, -2.2713208198547363, -0.4678173065185547, 1.3356866836547852, 3.139190673828125, 4.942693710327148, 6.746197700500488, 8.549705505371094, 10.353209495544434, 12.156713485717773, 13.960216522216797, 15.763720512390137, 17.567224502563477, 19.3707275390625, 21.174232482910156, 22.97773551940918, 24.781238555908203, 26.58474349975586, 28.388246536254883, 30.191749572753906, 31.995254516601562, 33.79875946044922, 35.60226058959961, 37.405765533447266, 39.20927047729492, 41.01277160644531, 42.81627655029297, 44.619781494140625, 46.42328643798828, 48.22678756713867, 50.03029251098633, 51.83379364013672, 53.637298583984375, 55.440799713134766, 57.24430465698242, 59.04780960083008, 60.85131072998047, 62.654815673828125, 64.45832061767578, 66.26182556152344]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 7.0, 3.0, 2.0, 4.0, 7.0, 12.0, 10.0, 12.0, 17.0, 14.0, 19.0, 20.0, 30.0, 25.0, 41.0, 30.0, 33.0, 34.0, 41.0, 33.0, 36.0, 33.0, 48.0, 32.0, 51.0, 39.0, 32.0, 39.0, 35.0, 25.0, 20.0, 25.0, 32.0, 28.0, 20.0, 19.0, 15.0, 20.0, 5.0, 9.0, 14.0, 10.0, 6.0, 4.0, 1.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-7.69140625, -7.4627685546875, -7.234130859375, -7.0054931640625, -6.77685546875, -6.5482177734375, -6.319580078125, -6.0909423828125, -5.8623046875, -5.6336669921875, -5.405029296875, -5.1763916015625, -4.94775390625, -4.7191162109375, -4.490478515625, -4.2618408203125, -4.033203125, -3.8045654296875, -3.575927734375, -3.3472900390625, -3.11865234375, -2.8900146484375, -2.661376953125, -2.4327392578125, -2.2041015625, -1.9754638671875, -1.746826171875, -1.5181884765625, -1.28955078125, -1.0609130859375, -0.832275390625, -0.6036376953125, -0.375, -0.1463623046875, 0.082275390625, 0.3109130859375, 0.53955078125, 0.7681884765625, 0.996826171875, 1.2254638671875, 1.4541015625, 1.6827392578125, 1.911376953125, 2.1400146484375, 2.36865234375, 2.5972900390625, 2.825927734375, 3.0545654296875, 3.283203125, 3.5118408203125, 3.740478515625, 3.9691162109375, 4.19775390625, 4.4263916015625, 4.655029296875, 4.8836669921875, 5.1123046875, 5.3409423828125, 5.569580078125, 5.7982177734375, 6.02685546875, 6.2554931640625, 6.484130859375, 6.7127685546875, 6.94140625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 9.0, 18.0, 24.0, 19.0, 31.0, 68.0, 81.0, 115.0, 184.0, 259.0, 377.0, 663.0, 1083.0, 2143.0, 4664.0, 13468.0, 65872.0, 571708.0, 2288083.0, 1077510.0, 133167.0, 21795.0, 6663.0, 2708.0, 1380.0, 741.0, 476.0, 307.0, 208.0, 122.0, 94.0, 72.0, 48.0, 36.0, 16.0, 28.0, 12.0, 8.0, 5.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.8125, -14.37255859375, -13.9326171875, -13.49267578125, -13.052734375, -12.61279296875, -12.1728515625, -11.73291015625, -11.29296875, -10.85302734375, -10.4130859375, -9.97314453125, -9.533203125, -9.09326171875, -8.6533203125, -8.21337890625, -7.7734375, -7.33349609375, -6.8935546875, -6.45361328125, -6.013671875, -5.57373046875, -5.1337890625, -4.69384765625, -4.25390625, -3.81396484375, -3.3740234375, -2.93408203125, -2.494140625, -2.05419921875, -1.6142578125, -1.17431640625, -0.734375, -0.29443359375, 0.1455078125, 0.58544921875, 1.025390625, 1.46533203125, 1.9052734375, 2.34521484375, 2.78515625, 3.22509765625, 3.6650390625, 4.10498046875, 4.544921875, 4.98486328125, 5.4248046875, 5.86474609375, 6.3046875, 6.74462890625, 7.1845703125, 7.62451171875, 8.064453125, 8.50439453125, 8.9443359375, 9.38427734375, 9.82421875, 10.26416015625, 10.7041015625, 11.14404296875, 11.583984375, 12.02392578125, 12.4638671875, 12.90380859375, 13.34375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 11.0, 38.0, 175.0, 792.0, 2041.0, 773.0, 200.0, 32.0, 15.0, 4.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.78125, -53.82568359375, -51.8701171875, -49.91455078125, -47.958984375, -46.00341796875, -44.0478515625, -42.09228515625, -40.13671875, -38.18115234375, -36.2255859375, -34.27001953125, -32.314453125, -30.35888671875, -28.4033203125, -26.44775390625, -24.4921875, -22.53662109375, -20.5810546875, -18.62548828125, -16.669921875, -14.71435546875, -12.7587890625, -10.80322265625, -8.84765625, -6.89208984375, -4.9365234375, -2.98095703125, -1.025390625, 0.93017578125, 2.8857421875, 4.84130859375, 6.796875, 8.75244140625, 10.7080078125, 12.66357421875, 14.619140625, 16.57470703125, 18.5302734375, 20.48583984375, 22.44140625, 24.39697265625, 26.3525390625, 28.30810546875, 30.263671875, 32.21923828125, 34.1748046875, 36.13037109375, 38.0859375, 40.04150390625, 41.9970703125, 43.95263671875, 45.908203125, 47.86376953125, 49.8193359375, 51.77490234375, 53.73046875, 55.68603515625, 57.6416015625, 59.59716796875, 61.552734375, 63.50830078125, 65.4638671875, 67.41943359375, 69.375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 1.0, 9.0, 17.0, 67.0, 292.0, 1197.0, 131522.0, 4058794.0, 1840.0, 394.0, 94.0, 26.0, 10.0, 11.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.5, -143.2998046875, -139.099609375, -134.8994140625, -130.69921875, -126.4990234375, -122.298828125, -118.0986328125, -113.8984375, -109.6982421875, -105.498046875, -101.2978515625, -97.09765625, -92.8974609375, -88.697265625, -84.4970703125, -80.296875, -76.0966796875, -71.896484375, -67.6962890625, -63.49609375, -59.2958984375, -55.095703125, -50.8955078125, -46.6953125, -42.4951171875, -38.294921875, -34.0947265625, -29.89453125, -25.6943359375, -21.494140625, -17.2939453125, -13.09375, -8.8935546875, -4.693359375, -0.4931640625, 3.70703125, 7.9072265625, 12.107421875, 16.3076171875, 20.5078125, 24.7080078125, 28.908203125, 33.1083984375, 37.30859375, 41.5087890625, 45.708984375, 49.9091796875, 54.109375, 58.3095703125, 62.509765625, 66.7099609375, 70.91015625, 75.1103515625, 79.310546875, 83.5107421875, 87.7109375, 91.9111328125, 96.111328125, 100.3115234375, 104.51171875, 108.7119140625, 112.912109375, 117.1123046875, 121.3125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 49.0, 211.0, 370.0, 281.0, 84.0, 14.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-254.54705810546875, -249.79550170898438, -245.04396057128906, -240.2924041748047, -235.54086303710938, -230.789306640625, -226.0377655029297, -221.2862091064453, -216.53466796875, -211.78311157226562, -207.0315704345703, -202.28001403808594, -197.52847290039062, -192.77691650390625, -188.02537536621094, -183.27381896972656, -178.5222625732422, -173.7707061767578, -169.0191650390625, -164.26760864257812, -159.5160675048828, -154.76451110839844, -150.01296997070312, -145.26141357421875, -140.50985717773438, -135.75830078125, -131.0067596435547, -126.25521087646484, -121.503662109375, -116.75210571289062, -112.00055694580078, -107.24900817871094, -102.49746704101562, -97.74591827392578, -92.99436950683594, -88.2428207397461, -83.49127197265625, -78.73971557617188, -73.98816680908203, -69.23661804199219, -64.48507690429688, -59.73352813720703, -54.98197937011719, -50.23042678833008, -45.478878021240234, -40.72732925415039, -35.97577667236328, -31.224227905273438, -26.472675323486328, -21.721126556396484, -16.969575881958008, -12.218026161193848, -7.4664764404296875, -2.7149276733398438, 2.036623001098633, 6.788173675537109, 11.539722442626953, 16.291271209716797, 21.042821884155273, 25.79437255859375, 30.545921325683594, 35.29747009277344, 40.04901885986328, 44.80057144165039, 49.552120208740234]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 0.0, 4.0, 6.0, 3.0, 8.0, 7.0, 6.0, 10.0, 19.0, 16.0, 20.0, 24.0, 23.0, 32.0, 38.0, 41.0, 44.0, 37.0, 39.0, 62.0, 56.0, 46.0, 46.0, 52.0, 33.0, 37.0, 42.0, 45.0, 31.0, 18.0, 35.0, 20.0, 19.0, 22.0, 18.0, 10.0, 11.0, 3.0, 9.0, 4.0, 4.0, 0.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.407440185546875, -53.52639389038086, -51.645347595214844, -49.76430130004883, -47.88325500488281, -46.0022087097168, -44.12116241455078, -42.2401123046875, -40.35906982421875, -38.478023529052734, -36.59697723388672, -34.7159309387207, -32.83488464355469, -30.953838348388672, -29.072790145874023, -27.191743850708008, -25.31069564819336, -23.429649353027344, -21.548603057861328, -19.667556762695312, -17.786510467529297, -15.905463218688965, -14.024415969848633, -12.143369674682617, -10.262323379516602, -8.381277084350586, -6.500230312347412, -4.619183540344238, -2.7381372451782227, -0.857090950012207, 1.023956298828125, 2.9050025939941406, 4.786048889160156, 6.667095184326172, 8.548141479492188, 10.42918872833252, 12.310235023498535, 14.19128131866455, 16.072328567504883, 17.9533748626709, 19.834421157836914, 21.71546745300293, 23.596513748168945, 25.477561950683594, 27.35860824584961, 29.239654541015625, 31.12070083618164, 33.001747131347656, 34.88279342651367, 36.76383972167969, 38.6448860168457, 40.52593231201172, 42.406978607177734, 44.28802490234375, 46.16907501220703, 48.05011749267578, 49.93116760253906, 51.81221389770508, 53.693260192871094, 55.57430648803711, 57.455352783203125, 59.33639907836914, 61.217445373535156, 63.09849548339844, 64.97953796386719]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 5.0, 10.0, 10.0, 13.0, 10.0, 17.0, 14.0, 21.0, 14.0, 20.0, 20.0, 27.0, 32.0, 27.0, 35.0, 39.0, 43.0, 42.0, 33.0, 44.0, 44.0, 34.0, 36.0, 32.0, 36.0, 31.0, 40.0, 31.0, 38.0, 29.0, 25.0, 22.0, 17.0, 14.0, 23.0, 13.0, 11.0, 11.0, 5.0, 5.0, 12.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.35546875, -6.15948486328125, -5.9635009765625, -5.76751708984375, -5.571533203125, -5.37554931640625, -5.1795654296875, -4.98358154296875, -4.78759765625, -4.59161376953125, -4.3956298828125, -4.19964599609375, -4.003662109375, -3.80767822265625, -3.6116943359375, -3.41571044921875, -3.2197265625, -3.02374267578125, -2.8277587890625, -2.63177490234375, -2.435791015625, -2.23980712890625, -2.0438232421875, -1.84783935546875, -1.65185546875, -1.45587158203125, -1.2598876953125, -1.06390380859375, -0.867919921875, -0.67193603515625, -0.4759521484375, -0.27996826171875, -0.083984375, 0.11199951171875, 0.3079833984375, 0.50396728515625, 0.699951171875, 0.89593505859375, 1.0919189453125, 1.28790283203125, 1.48388671875, 1.67987060546875, 1.8758544921875, 2.07183837890625, 2.267822265625, 2.46380615234375, 2.6597900390625, 2.85577392578125, 3.0517578125, 3.24774169921875, 3.4437255859375, 3.63970947265625, 3.835693359375, 4.03167724609375, 4.2276611328125, 4.42364501953125, 4.61962890625, 4.81561279296875, 5.0115966796875, 5.20758056640625, 5.403564453125, 5.59954833984375, 5.7955322265625, 5.99151611328125, 6.1875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 5.0, 8.0, 16.0, 19.0, 29.0, 44.0, 74.0, 88.0, 131.0, 216.0, 277.0, 450.0, 644.0, 948.0, 1406.0, 2149.0, 3152.0, 4638.0, 6974.0, 10212.0, 15095.0, 22629.0, 35035.0, 55085.0, 92685.0, 195531.0, 286580.0, 121785.0, 68045.0, 41994.0, 27369.0, 17973.0, 12057.0, 8235.0, 5507.0, 3769.0, 2480.0, 1715.0, 1115.0, 766.0, 563.0, 327.0, 255.0, 140.0, 106.0, 73.0, 61.0, 37.0, 23.0, 16.0, 8.0, 5.0, 7.0, 4.0, 3.0, 0.0, 1.0, 2.0], "bins": [-1.244140625, -1.2055206298828125, -1.166900634765625, -1.1282806396484375, -1.08966064453125, -1.0510406494140625, -1.012420654296875, -0.9738006591796875, -0.9351806640625, -0.8965606689453125, -0.857940673828125, -0.8193206787109375, -0.78070068359375, -0.7420806884765625, -0.703460693359375, -0.6648406982421875, -0.626220703125, -0.5876007080078125, -0.548980712890625, -0.5103607177734375, -0.47174072265625, -0.4331207275390625, -0.394500732421875, -0.3558807373046875, -0.3172607421875, -0.2786407470703125, -0.240020751953125, -0.2014007568359375, -0.16278076171875, -0.1241607666015625, -0.085540771484375, -0.0469207763671875, -0.00830078125, 0.0303192138671875, 0.068939208984375, 0.1075592041015625, 0.14617919921875, 0.1847991943359375, 0.223419189453125, 0.2620391845703125, 0.3006591796875, 0.3392791748046875, 0.377899169921875, 0.4165191650390625, 0.45513916015625, 0.4937591552734375, 0.532379150390625, 0.5709991455078125, 0.609619140625, 0.6482391357421875, 0.686859130859375, 0.7254791259765625, 0.76409912109375, 0.8027191162109375, 0.841339111328125, 0.8799591064453125, 0.9185791015625, 0.9571990966796875, 0.995819091796875, 1.0344390869140625, 1.07305908203125, 1.1116790771484375, 1.150299072265625, 1.1889190673828125, 1.2275390625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 8.0, 4.0, 5.0, 12.0, 9.0, 14.0, 10.0, 21.0, 15.0, 28.0, 20.0, 30.0, 28.0, 45.0, 35.0, 34.0, 45.0, 46.0, 53.0, 1078.0, 44.0, 42.0, 41.0, 37.0, 41.0, 38.0, 36.0, 27.0, 31.0, 29.0, 20.0, 28.0, 13.0, 15.0, 9.0, 7.0, 10.0, 6.0, 3.0, 1.0, 3.0, 8.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0703125, -3.92742919921875, -3.7845458984375, -3.64166259765625, -3.498779296875, -3.35589599609375, -3.2130126953125, -3.07012939453125, -2.92724609375, -2.78436279296875, -2.6414794921875, -2.49859619140625, -2.355712890625, -2.21282958984375, -2.0699462890625, -1.92706298828125, -1.7841796875, -1.64129638671875, -1.4984130859375, -1.35552978515625, -1.212646484375, -1.06976318359375, -0.9268798828125, -0.78399658203125, -0.64111328125, -0.49822998046875, -0.3553466796875, -0.21246337890625, -0.069580078125, 0.07330322265625, 0.2161865234375, 0.35906982421875, 0.501953125, 0.64483642578125, 0.7877197265625, 0.93060302734375, 1.073486328125, 1.21636962890625, 1.3592529296875, 1.50213623046875, 1.64501953125, 1.78790283203125, 1.9307861328125, 2.07366943359375, 2.216552734375, 2.35943603515625, 2.5023193359375, 2.64520263671875, 2.7880859375, 2.93096923828125, 3.0738525390625, 3.21673583984375, 3.359619140625, 3.50250244140625, 3.6453857421875, 3.78826904296875, 3.93115234375, 4.07403564453125, 4.2169189453125, 4.35980224609375, 4.502685546875, 4.64556884765625, 4.7884521484375, 4.93133544921875, 5.07421875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 8.0, 3.0, 1.0, 6.0, 8.0, 11.0, 12.0, 17.0, 29.0, 47.0, 99.0, 146.0, 276.0, 535.0, 1044.0, 1892.0, 3778.0, 7667.0, 15817.0, 33974.0, 77326.0, 220038.0, 1509197.0, 126635.0, 52292.0, 23614.0, 11280.0, 5527.0, 2763.0, 1446.0, 720.0, 402.0, 223.0, 123.0, 60.0, 37.0, 23.0, 25.0, 11.0, 9.0, 5.0, 7.0, 0.0, 7.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.453125, -2.3835601806640625, -2.313995361328125, -2.2444305419921875, -2.17486572265625, -2.1053009033203125, -2.035736083984375, -1.9661712646484375, -1.8966064453125, -1.8270416259765625, -1.757476806640625, -1.6879119873046875, -1.61834716796875, -1.5487823486328125, -1.479217529296875, -1.4096527099609375, -1.340087890625, -1.2705230712890625, -1.200958251953125, -1.1313934326171875, -1.06182861328125, -0.9922637939453125, -0.922698974609375, -0.8531341552734375, -0.7835693359375, -0.7140045166015625, -0.644439697265625, -0.5748748779296875, -0.50531005859375, -0.4357452392578125, -0.366180419921875, -0.2966156005859375, -0.22705078125, -0.1574859619140625, -0.087921142578125, -0.0183563232421875, 0.05120849609375, 0.1207733154296875, 0.190338134765625, 0.2599029541015625, 0.3294677734375, 0.3990325927734375, 0.468597412109375, 0.5381622314453125, 0.60772705078125, 0.6772918701171875, 0.746856689453125, 0.8164215087890625, 0.885986328125, 0.9555511474609375, 1.025115966796875, 1.0946807861328125, 1.16424560546875, 1.2338104248046875, 1.303375244140625, 1.3729400634765625, 1.4425048828125, 1.5120697021484375, 1.581634521484375, 1.6511993408203125, 1.72076416015625, 1.7903289794921875, 1.859893798828125, 1.9294586181640625, 1.9990234375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 4.0, 3.0, 3.0, 9.0, 10.0, 12.0, 12.0, 18.0, 31.0, 29.0, 39.0, 43.0, 62.0, 59.0, 66.0, 85.0, 74.0, 67.0, 68.0, 50.0, 42.0, 37.0, 35.0, 27.0, 24.0, 14.0, 14.0, 8.0, 12.0, 11.0, 6.0, 3.0, 3.0, 7.0, 4.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009188652038574219, -0.0008891746401786804, -0.000859484076499939, -0.0008297935128211975, -0.0008001029491424561, -0.0007704123854637146, -0.0007407218217849731, -0.0007110312581062317, -0.0006813406944274902, -0.0006516501307487488, -0.0006219595670700073, -0.0005922690033912659, -0.0005625784397125244, -0.000532887876033783, -0.0005031973123550415, -0.00047350674867630005, -0.0004438161849975586, -0.00041412562131881714, -0.0003844350576400757, -0.00035474449396133423, -0.0003250539302825928, -0.0002953633666038513, -0.00026567280292510986, -0.0002359822392463684, -0.00020629167556762695, -0.0001766011118888855, -0.00014691054821014404, -0.00011721998453140259, -8.752942085266113e-05, -5.783885717391968e-05, -2.8148293495178223e-05, 1.5422701835632324e-06, 3.123283386230469e-05, 6.092339754104614e-05, 9.06139612197876e-05, 0.00012030452489852905, 0.0001499950885772705, 0.00017968565225601196, 0.00020937621593475342, 0.00023906677961349487, 0.00026875734329223633, 0.0002984479069709778, 0.00032813847064971924, 0.0003578290343284607, 0.00038751959800720215, 0.0004172101616859436, 0.00044690072536468506, 0.0004765912890434265, 0.000506281852722168, 0.0005359724164009094, 0.0005656629800796509, 0.0005953535437583923, 0.0006250441074371338, 0.0006547346711158752, 0.0006844252347946167, 0.0007141157984733582, 0.0007438063621520996, 0.0007734969258308411, 0.0008031874895095825, 0.000832878053188324, 0.0008625686168670654, 0.0008922591805458069, 0.0009219497442245483, 0.0009516403079032898, 0.0009813308715820312]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 4.0, 3.0, 4.0, 7.0, 5.0, 9.0, 15.0, 13.0, 16.0, 16.0, 25.0, 31.0, 34.0, 51.0, 79.0, 95.0, 150.0, 175.0, 262.0, 422.0, 724.0, 2227.0, 1017471.0, 24194.0, 973.0, 500.0, 304.0, 182.0, 150.0, 91.0, 85.0, 50.0, 51.0, 34.0, 24.0, 22.0, 14.0, 8.0, 6.0, 7.0, 6.0, 5.0, 5.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.0192413330078125, -0.018717169761657715, -0.01819300651550293, -0.017668843269348145, -0.01714468002319336, -0.016620516777038574, -0.01609635353088379, -0.015572190284729004, -0.015048027038574219, -0.014523863792419434, -0.013999700546264648, -0.013475537300109863, -0.012951374053955078, -0.012427210807800293, -0.011903047561645508, -0.011378884315490723, -0.010854721069335938, -0.010330557823181152, -0.009806394577026367, -0.009282231330871582, -0.008758068084716797, -0.008233904838562012, -0.0077097415924072266, -0.007185578346252441, -0.006661415100097656, -0.006137251853942871, -0.005613088607788086, -0.005088925361633301, -0.004564762115478516, -0.0040405988693237305, -0.0035164356231689453, -0.00299227237701416, -0.002468109130859375, -0.0019439458847045898, -0.0014197826385498047, -0.0008956193923950195, -0.0003714561462402344, 0.00015270709991455078, 0.0006768703460693359, 0.001201033592224121, 0.0017251968383789062, 0.0022493600845336914, 0.0027735233306884766, 0.0032976865768432617, 0.003821849822998047, 0.004346013069152832, 0.004870176315307617, 0.005394339561462402, 0.0059185028076171875, 0.006442666053771973, 0.006966829299926758, 0.007490992546081543, 0.008015155792236328, 0.008539319038391113, 0.009063482284545898, 0.009587645530700684, 0.010111808776855469, 0.010635972023010254, 0.011160135269165039, 0.011684298515319824, 0.01220846176147461, 0.012732625007629395, 0.01325678825378418, 0.013780951499938965, 0.01430511474609375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 15.0, 106.0, 404.0, 377.0, 91.0, 16.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0023517096415162086, -0.0023026899434626102, -0.002253670245409012, -0.0022046505473554134, -0.002155630849301815, -0.0021066111512482166, -0.0020575914531946182, -0.0020085719879716635, -0.001959552289918065, -0.0019105325918644667, -0.0018615128938108683, -0.0018124931957572699, -0.0017634736141189933, -0.0017144539160653949, -0.0016654342180117965, -0.001616414519958198, -0.0015673948219045997, -0.0015183751238510013, -0.0014693554257974029, -0.0014203358441591263, -0.0013713161461055279, -0.0013222964480519295, -0.001273276749998331, -0.0012242570519447327, -0.0011752373538911343, -0.0011262176558375359, -0.0010771979577839375, -0.001028178259730339, -0.0009791586780920625, -0.0009301389800384641, -0.0008811192819848657, -0.0008320995839312673, -0.0007830800022929907, -0.0007340603042393923, -0.0006850406643934548, -0.0006360209663398564, -0.0005870013264939189, -0.0005379816284403205, -0.0004889619303867221, -0.00043994226143695414, -0.0003909225924871862, -0.00034190292353741825, -0.0002928832545876503, -0.0002438635565340519, -0.00019484388758428395, -0.000145824218634516, -9.68045205809176e-05, -4.778485163114965e-05, 1.2348173186182976e-06, 5.025449354434386e-05, 9.927416977006942e-05, 0.0001482938532717526, 0.00019731352222152054, 0.0002463331911712885, 0.0002953528892248869, 0.00034437255817465484, 0.0003933922271244228, 0.00044241189607419074, 0.0004914315650239587, 0.0005404512630775571, 0.0005894709611311555, 0.000638490600977093, 0.0006875102990306914, 0.0007365299388766289, 0.0007855496369302273]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 5.0, 6.0, 6.0, 8.0, 13.0, 18.0, 13.0, 20.0, 17.0, 16.0, 24.0, 28.0, 29.0, 34.0, 38.0, 40.0, 36.0, 53.0, 39.0, 35.0, 37.0, 34.0, 42.0, 53.0, 35.0, 32.0, 28.0, 30.0, 28.0, 26.0, 30.0, 29.0, 23.0, 13.0, 15.0, 12.0, 11.0, 11.0, 6.0, 4.0, 7.0, 9.0, 2.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00043016672134399414, -0.00041640177369117737, -0.0004026368260383606, -0.0003888718783855438, -0.00037510693073272705, -0.0003613419830799103, -0.0003475770354270935, -0.00033381208777427673, -0.00032004714012145996, -0.0003062821924686432, -0.0002925172448158264, -0.00027875229716300964, -0.00026498734951019287, -0.0002512224018573761, -0.00023745745420455933, -0.00022369250655174255, -0.00020992755889892578, -0.000196162611246109, -0.00018239766359329224, -0.00016863271594047546, -0.0001548677682876587, -0.00014110282063484192, -0.00012733787298202515, -0.00011357292532920837, -9.98079776763916e-05, -8.604303002357483e-05, -7.227808237075806e-05, -5.8513134717941284e-05, -4.474818706512451e-05, -3.098323941230774e-05, -1.7218291759490967e-05, -3.4533441066741943e-06, 1.0311603546142578e-05, 2.407655119895935e-05, 3.784149885177612e-05, 5.1606446504592896e-05, 6.537139415740967e-05, 7.913634181022644e-05, 9.290128946304321e-05, 0.00010666623711585999, 0.00012043118476867676, 0.00013419613242149353, 0.0001479610800743103, 0.00016172602772712708, 0.00017549097537994385, 0.00018925592303276062, 0.0002030208706855774, 0.00021678581833839417, 0.00023055076599121094, 0.0002443157136440277, 0.0002580806612968445, 0.00027184560894966125, 0.00028561055660247803, 0.0002993755042552948, 0.00031314045190811157, 0.00032690539956092834, 0.0003406703472137451, 0.0003544352948665619, 0.00036820024251937866, 0.00038196519017219543, 0.0003957301378250122, 0.000409495085477829, 0.00042326003313064575, 0.0004370249807834625, 0.0004507899284362793]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 5.0, 10.0, 10.0, 13.0, 10.0, 17.0, 14.0, 21.0, 14.0, 20.0, 20.0, 27.0, 32.0, 27.0, 35.0, 39.0, 43.0, 42.0, 33.0, 44.0, 43.0, 35.0, 36.0, 32.0, 36.0, 31.0, 40.0, 31.0, 38.0, 29.0, 25.0, 22.0, 17.0, 14.0, 23.0, 13.0, 11.0, 11.0, 5.0, 5.0, 12.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.35546875, -6.15948486328125, -5.9635009765625, -5.76751708984375, -5.571533203125, -5.37554931640625, -5.1795654296875, -4.98358154296875, -4.78759765625, -4.59161376953125, -4.3956298828125, -4.19964599609375, -4.003662109375, -3.80767822265625, -3.6116943359375, -3.41571044921875, -3.2197265625, -3.02374267578125, -2.8277587890625, -2.63177490234375, -2.435791015625, -2.23980712890625, -2.0438232421875, -1.84783935546875, -1.65185546875, -1.45587158203125, -1.2598876953125, -1.06390380859375, -0.867919921875, -0.67193603515625, -0.4759521484375, -0.27996826171875, -0.083984375, 0.11199951171875, 0.3079833984375, 0.50396728515625, 0.699951171875, 0.89593505859375, 1.0919189453125, 1.28790283203125, 1.48388671875, 1.67987060546875, 1.8758544921875, 2.07183837890625, 2.267822265625, 2.46380615234375, 2.6597900390625, 2.85577392578125, 3.0517578125, 3.24774169921875, 3.4437255859375, 3.63970947265625, 3.835693359375, 4.03167724609375, 4.2276611328125, 4.42364501953125, 4.61962890625, 4.81561279296875, 5.0115966796875, 5.20758056640625, 5.403564453125, 5.59954833984375, 5.7955322265625, 5.99151611328125, 6.1875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 0.0, 3.0, 13.0, 8.0, 5.0, 15.0, 18.0, 24.0, 29.0, 34.0, 56.0, 74.0, 96.0, 103.0, 160.0, 253.0, 326.0, 458.0, 754.0, 1182.0, 2092.0, 4498.0, 10765.0, 31840.0, 124712.0, 557562.0, 233672.0, 50726.0, 15867.0, 6109.0, 2736.0, 1550.0, 853.0, 593.0, 387.0, 265.0, 185.0, 140.0, 103.0, 72.0, 46.0, 40.0, 30.0, 24.0, 15.0, 21.0, 17.0, 4.0, 10.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-11.3046875, -10.9691162109375, -10.633544921875, -10.2979736328125, -9.96240234375, -9.6268310546875, -9.291259765625, -8.9556884765625, -8.6201171875, -8.2845458984375, -7.948974609375, -7.6134033203125, -7.27783203125, -6.9422607421875, -6.606689453125, -6.2711181640625, -5.935546875, -5.5999755859375, -5.264404296875, -4.9288330078125, -4.59326171875, -4.2576904296875, -3.922119140625, -3.5865478515625, -3.2509765625, -2.9154052734375, -2.579833984375, -2.2442626953125, -1.90869140625, -1.5731201171875, -1.237548828125, -0.9019775390625, -0.56640625, -0.2308349609375, 0.104736328125, 0.4403076171875, 0.77587890625, 1.1114501953125, 1.447021484375, 1.7825927734375, 2.1181640625, 2.4537353515625, 2.789306640625, 3.1248779296875, 3.46044921875, 3.7960205078125, 4.131591796875, 4.4671630859375, 4.802734375, 5.1383056640625, 5.473876953125, 5.8094482421875, 6.14501953125, 6.4805908203125, 6.816162109375, 7.1517333984375, 7.4873046875, 7.8228759765625, 8.158447265625, 8.4940185546875, 8.82958984375, 9.1651611328125, 9.500732421875, 9.8363037109375, 10.171875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 7.0, 6.0, 16.0, 8.0, 17.0, 24.0, 22.0, 26.0, 27.0, 29.0, 50.0, 51.0, 55.0, 57.0, 126.0, 1680.0, 348.0, 83.0, 50.0, 55.0, 50.0, 50.0, 44.0, 25.0, 18.0, 23.0, 27.0, 14.0, 7.0, 11.0, 5.0, 7.0, 3.0, 3.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-17.25, -16.670166015625, -16.09033203125, -15.510498046875, -14.9306640625, -14.350830078125, -13.77099609375, -13.191162109375, -12.611328125, -12.031494140625, -11.45166015625, -10.871826171875, -10.2919921875, -9.712158203125, -9.13232421875, -8.552490234375, -7.97265625, -7.392822265625, -6.81298828125, -6.233154296875, -5.6533203125, -5.073486328125, -4.49365234375, -3.913818359375, -3.333984375, -2.754150390625, -2.17431640625, -1.594482421875, -1.0146484375, -0.434814453125, 0.14501953125, 0.724853515625, 1.3046875, 1.884521484375, 2.46435546875, 3.044189453125, 3.6240234375, 4.203857421875, 4.78369140625, 5.363525390625, 5.943359375, 6.523193359375, 7.10302734375, 7.682861328125, 8.2626953125, 8.842529296875, 9.42236328125, 10.002197265625, 10.58203125, 11.161865234375, 11.74169921875, 12.321533203125, 12.9013671875, 13.481201171875, 14.06103515625, 14.640869140625, 15.220703125, 15.800537109375, 16.38037109375, 16.960205078125, 17.5400390625, 18.119873046875, 18.69970703125, 19.279541015625, 19.859375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 4.0, 4.0, 6.0, 6.0, 6.0, 16.0, 11.0, 14.0, 26.0, 28.0, 40.0, 54.0, 82.0, 110.0, 200.0, 354.0, 655.0, 2129.0, 2987287.0, 151983.0, 1399.0, 496.0, 275.0, 158.0, 101.0, 70.0, 33.0, 37.0, 20.0, 25.0, 18.0, 7.0, 10.0, 7.0, 10.0, 1.0, 7.0, 4.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-54.21875, -52.66455078125, -51.1103515625, -49.55615234375, -48.001953125, -46.44775390625, -44.8935546875, -43.33935546875, -41.78515625, -40.23095703125, -38.6767578125, -37.12255859375, -35.568359375, -34.01416015625, -32.4599609375, -30.90576171875, -29.3515625, -27.79736328125, -26.2431640625, -24.68896484375, -23.134765625, -21.58056640625, -20.0263671875, -18.47216796875, -16.91796875, -15.36376953125, -13.8095703125, -12.25537109375, -10.701171875, -9.14697265625, -7.5927734375, -6.03857421875, -4.484375, -2.93017578125, -1.3759765625, 0.17822265625, 1.732421875, 3.28662109375, 4.8408203125, 6.39501953125, 7.94921875, 9.50341796875, 11.0576171875, 12.61181640625, 14.166015625, 15.72021484375, 17.2744140625, 18.82861328125, 20.3828125, 21.93701171875, 23.4912109375, 25.04541015625, 26.599609375, 28.15380859375, 29.7080078125, 31.26220703125, 32.81640625, 34.37060546875, 35.9248046875, 37.47900390625, 39.033203125, 40.58740234375, 42.1416015625, 43.69580078125, 45.25]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [2.0, 1.0, 12.0, 384.0, 603.0, 16.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.13548469543457, -13.705301284790039, -9.275118827819824, -4.844936370849609, -0.4147529602050781, 4.015430450439453, 8.445611953735352, 12.875795364379883, 17.305978775024414, 21.736162185668945, 26.166343688964844, 30.596527099609375, 35.026710510253906, 39.45689392089844, 43.88707733154297, 48.3172607421875, 52.74744415283203, 57.17762756347656, 61.607810974121094, 66.03799438476562, 70.46817779541016, 74.89836120605469, 79.32853698730469, 83.75872802734375, 88.18890380859375, 92.61908721923828, 97.04927062988281, 101.47945404052734, 105.90963745117188, 110.3398208618164, 114.77000427246094, 119.20018005371094, 123.63035583496094, 128.06053161621094, 132.49072265625, 136.9208984375, 141.35108947753906, 145.78126525878906, 150.21145629882812, 154.64163208007812, 159.0718231201172, 163.5019989013672, 167.93218994140625, 172.36236572265625, 176.7925567626953, 181.2227325439453, 185.65292358398438, 190.08309936523438, 194.51327514648438, 198.94345092773438, 203.37364196777344, 207.80381774902344, 212.2340087890625, 216.6641845703125, 221.09437561035156, 225.52455139160156, 229.95474243164062, 234.38491821289062, 238.8151092529297, 243.2452850341797, 247.67547607421875, 252.10565185546875, 256.53582763671875, 260.9660339355469, 265.3962097167969]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 3.0, 7.0, 6.0, 6.0, 13.0, 10.0, 16.0, 11.0, 19.0, 17.0, 19.0, 25.0, 30.0, 25.0, 27.0, 33.0, 40.0, 40.0, 39.0, 48.0, 40.0, 39.0, 54.0, 47.0, 46.0, 37.0, 38.0, 25.0, 30.0, 31.0, 20.0, 30.0, 20.0, 19.0, 10.0, 12.0, 14.0, 13.0, 8.0, 12.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0], "bins": [-35.401763916015625, -34.20891189575195, -33.01605987548828, -31.823205947875977, -30.630352020263672, -29.4375, -28.244647979736328, -27.051795959472656, -25.85894203186035, -24.66609001159668, -23.473236083984375, -22.280384063720703, -21.08753204345703, -19.894678115844727, -18.701826095581055, -17.50897216796875, -16.316120147705078, -15.12326717376709, -13.930414199829102, -12.73756217956543, -11.544709205627441, -10.351856231689453, -9.159004211425781, -7.966151237487793, -6.773298263549805, -5.580445289611816, -4.387592792510986, -3.194740056991577, -2.001887321472168, -0.8090343475341797, 0.3838181495666504, 1.5766706466674805, 2.769519805908203, 3.9623725414276123, 5.1552252769470215, 6.348077774047852, 7.54093074798584, 8.733783721923828, 9.9266357421875, 11.119488716125488, 12.312341690063477, 13.505194664001465, 14.698047637939453, 15.890899658203125, 17.083751678466797, 18.2766056060791, 19.469457626342773, 20.662311553955078, 21.85516357421875, 23.048015594482422, 24.240869522094727, 25.4337215423584, 26.626575469970703, 27.819427490234375, 29.012279510498047, 30.20513153076172, 31.397985458374023, 32.59083938598633, 33.78369140625, 34.97654342651367, 36.169395446777344, 37.36225128173828, 38.55510330200195, 39.747955322265625, 40.9408073425293]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 8.0, 6.0, 4.0, 10.0, 8.0, 16.0, 16.0, 15.0, 14.0, 20.0, 23.0, 25.0, 43.0, 39.0, 31.0, 37.0, 45.0, 42.0, 39.0, 45.0, 29.0, 39.0, 52.0, 39.0, 36.0, 39.0, 38.0, 31.0, 31.0, 29.0, 27.0, 22.0, 16.0, 17.0, 17.0, 15.0, 12.0, 8.0, 3.0, 5.0, 4.0, 6.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-8.4765625, -8.23736572265625, -7.9981689453125, -7.75897216796875, -7.519775390625, -7.28057861328125, -7.0413818359375, -6.80218505859375, -6.56298828125, -6.32379150390625, -6.0845947265625, -5.84539794921875, -5.606201171875, -5.36700439453125, -5.1278076171875, -4.88861083984375, -4.6494140625, -4.41021728515625, -4.1710205078125, -3.93182373046875, -3.692626953125, -3.45343017578125, -3.2142333984375, -2.97503662109375, -2.73583984375, -2.49664306640625, -2.2574462890625, -2.01824951171875, -1.779052734375, -1.53985595703125, -1.3006591796875, -1.06146240234375, -0.822265625, -0.58306884765625, -0.3438720703125, -0.10467529296875, 0.134521484375, 0.37371826171875, 0.6129150390625, 0.85211181640625, 1.09130859375, 1.33050537109375, 1.5697021484375, 1.80889892578125, 2.048095703125, 2.28729248046875, 2.5264892578125, 2.76568603515625, 3.0048828125, 3.24407958984375, 3.4832763671875, 3.72247314453125, 3.961669921875, 4.20086669921875, 4.4400634765625, 4.67926025390625, 4.91845703125, 5.15765380859375, 5.3968505859375, 5.63604736328125, 5.875244140625, 6.11444091796875, 6.3536376953125, 6.59283447265625, 6.83203125]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 6.0, 6.0, 12.0, 8.0, 19.0, 27.0, 27.0, 49.0, 52.0, 75.0, 79.0, 110.0, 150.0, 200.0, 261.0, 350.0, 542.0, 910.0, 2046.0, 15041.0, 2632389.0, 1528010.0, 9433.0, 1765.0, 839.0, 482.0, 373.0, 261.0, 168.0, 115.0, 92.0, 86.0, 70.0, 54.0, 40.0, 31.0, 28.0, 19.0, 15.0, 11.0, 8.0, 5.0, 6.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-45.84375, -44.40771484375, -42.9716796875, -41.53564453125, -40.099609375, -38.66357421875, -37.2275390625, -35.79150390625, -34.35546875, -32.91943359375, -31.4833984375, -30.04736328125, -28.611328125, -27.17529296875, -25.7392578125, -24.30322265625, -22.8671875, -21.43115234375, -19.9951171875, -18.55908203125, -17.123046875, -15.68701171875, -14.2509765625, -12.81494140625, -11.37890625, -9.94287109375, -8.5068359375, -7.07080078125, -5.634765625, -4.19873046875, -2.7626953125, -1.32666015625, 0.109375, 1.54541015625, 2.9814453125, 4.41748046875, 5.853515625, 7.28955078125, 8.7255859375, 10.16162109375, 11.59765625, 13.03369140625, 14.4697265625, 15.90576171875, 17.341796875, 18.77783203125, 20.2138671875, 21.64990234375, 23.0859375, 24.52197265625, 25.9580078125, 27.39404296875, 28.830078125, 30.26611328125, 31.7021484375, 33.13818359375, 34.57421875, 36.01025390625, 37.4462890625, 38.88232421875, 40.318359375, 41.75439453125, 43.1904296875, 44.62646484375, 46.0625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 13.0, 7.0, 16.0, 19.0, 34.0, 92.0, 166.0, 347.0, 683.0, 1049.0, 798.0, 443.0, 216.0, 84.0, 57.0, 26.0, 8.0, 10.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.375, -23.628662109375, -22.88232421875, -22.135986328125, -21.3896484375, -20.643310546875, -19.89697265625, -19.150634765625, -18.404296875, -17.657958984375, -16.91162109375, -16.165283203125, -15.4189453125, -14.672607421875, -13.92626953125, -13.179931640625, -12.43359375, -11.687255859375, -10.94091796875, -10.194580078125, -9.4482421875, -8.701904296875, -7.95556640625, -7.209228515625, -6.462890625, -5.716552734375, -4.97021484375, -4.223876953125, -3.4775390625, -2.731201171875, -1.98486328125, -1.238525390625, -0.4921875, 0.254150390625, 1.00048828125, 1.746826171875, 2.4931640625, 3.239501953125, 3.98583984375, 4.732177734375, 5.478515625, 6.224853515625, 6.97119140625, 7.717529296875, 8.4638671875, 9.210205078125, 9.95654296875, 10.702880859375, 11.44921875, 12.195556640625, 12.94189453125, 13.688232421875, 14.4345703125, 15.180908203125, 15.92724609375, 16.673583984375, 17.419921875, 18.166259765625, 18.91259765625, 19.658935546875, 20.4052734375, 21.151611328125, 21.89794921875, 22.644287109375, 23.390625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 5.0, 7.0, 12.0, 29.0, 36.0, 69.0, 176.0, 430.0, 1422.0, 9175.0, 235978.0, 3834128.0, 105051.0, 5908.0, 1149.0, 400.0, 136.0, 59.0, 33.0, 19.0, 13.0, 10.0, 10.0, 6.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.46875, -26.53466796875, -25.6005859375, -24.66650390625, -23.732421875, -22.79833984375, -21.8642578125, -20.93017578125, -19.99609375, -19.06201171875, -18.1279296875, -17.19384765625, -16.259765625, -15.32568359375, -14.3916015625, -13.45751953125, -12.5234375, -11.58935546875, -10.6552734375, -9.72119140625, -8.787109375, -7.85302734375, -6.9189453125, -5.98486328125, -5.05078125, -4.11669921875, -3.1826171875, -2.24853515625, -1.314453125, -0.38037109375, 0.5537109375, 1.48779296875, 2.421875, 3.35595703125, 4.2900390625, 5.22412109375, 6.158203125, 7.09228515625, 8.0263671875, 8.96044921875, 9.89453125, 10.82861328125, 11.7626953125, 12.69677734375, 13.630859375, 14.56494140625, 15.4990234375, 16.43310546875, 17.3671875, 18.30126953125, 19.2353515625, 20.16943359375, 21.103515625, 22.03759765625, 22.9716796875, 23.90576171875, 24.83984375, 25.77392578125, 26.7080078125, 27.64208984375, 28.576171875, 29.51025390625, 30.4443359375, 31.37841796875, 32.3125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 9.0, 7.0, 17.0, 18.0, 25.0, 51.0, 66.0, 83.0, 118.0, 115.0, 127.0, 122.0, 76.0, 48.0, 49.0, 32.0, 15.0, 8.0, 7.0, 4.0, 6.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.04447174072266, -85.04766082763672, -82.05084991455078, -79.05403137207031, -76.05722045898438, -73.06040954589844, -70.0635986328125, -67.06678771972656, -64.06997680664062, -61.07316589355469, -58.076351165771484, -55.07954025268555, -52.08272933959961, -49.085914611816406, -46.08910369873047, -43.09229278564453, -40.09547805786133, -37.09866714477539, -34.10185241699219, -31.10504150390625, -28.108230590820312, -25.111417770385742, -22.114604949951172, -19.117794036865234, -16.120981216430664, -13.12416934967041, -10.127357482910156, -7.130544662475586, -4.133732795715332, -1.1369209289550781, 1.8598918914794922, 4.85670280456543, 7.853515625, 10.850327491760254, 13.847139358520508, 16.843952178955078, 19.840763092041016, 22.837575912475586, 25.834388732910156, 28.831199645996094, 31.828012466430664, 34.824825286865234, 37.82163619995117, 40.818450927734375, 43.81526184082031, 46.81207275390625, 49.80888366699219, 52.805694580078125, 55.80250930786133, 58.799320220947266, 61.79613494873047, 64.7929458618164, 67.78975677490234, 70.78656768798828, 73.78338623046875, 76.78019714355469, 79.77700805664062, 82.77381896972656, 85.7706298828125, 88.76744079589844, 91.7642593383789, 94.76107025146484, 97.75788116455078, 100.75469207763672, 103.75150299072266]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 10.0, 12.0, 6.0, 13.0, 17.0, 17.0, 16.0, 28.0, 33.0, 45.0, 42.0, 67.0, 49.0, 71.0, 59.0, 63.0, 50.0, 61.0, 45.0, 41.0, 37.0, 36.0, 39.0, 25.0, 31.0, 29.0, 8.0, 11.0, 11.0, 5.0, 3.0, 7.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.209495544433594, -56.39618682861328, -54.5828742980957, -52.76956558227539, -50.95625305175781, -49.1429443359375, -47.32963562011719, -45.51632308959961, -43.70301055908203, -41.88970184326172, -40.07638931274414, -38.26308059692383, -36.44976806640625, -34.63645935058594, -32.823150634765625, -31.009838104248047, -29.196529388427734, -27.38321876525879, -25.569908142089844, -23.75659942626953, -21.943286895751953, -20.12997817993164, -18.316667556762695, -16.50335693359375, -14.690046310424805, -12.87673568725586, -11.063425064086914, -9.250115394592285, -7.43680477142334, -5.6234941482543945, -3.8101844787597656, -1.9968738555908203, -0.18356704711914062, 1.6297433376312256, 3.443053722381592, 5.256363868713379, 7.069674491882324, 8.88298511505127, 10.696294784545898, 12.509605407714844, 14.322916030883789, 16.136226654052734, 17.94953727722168, 19.762847900390625, 21.576156616210938, 23.389469146728516, 25.202777862548828, 27.016088485717773, 28.82939910888672, 30.642709732055664, 32.45602035522461, 34.26932907104492, 36.0826416015625, 37.89595031738281, 39.709259033203125, 41.5225715637207, 43.33588409423828, 45.149192810058594, 46.96250534057617, 48.775814056396484, 50.58912658691406, 52.402435302734375, 54.21574401855469, 56.029056549072266, 57.84236526489258]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 2.0, 7.0, 5.0, 6.0, 8.0, 13.0, 4.0, 6.0, 15.0, 21.0, 26.0, 27.0, 28.0, 31.0, 49.0, 47.0, 49.0, 54.0, 49.0, 55.0, 53.0, 55.0, 48.0, 37.0, 33.0, 34.0, 25.0, 35.0, 41.0, 31.0, 15.0, 24.0, 14.0, 11.0, 9.0, 9.0, 6.0, 7.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.125, -79.7744140625, -77.423828125, -75.0732421875, -72.72265625, -70.3720703125, -68.021484375, -65.6708984375, -63.3203125, -60.9697265625, -58.619140625, -56.2685546875, -53.91796875, -51.5673828125, -49.216796875, -46.8662109375, -44.515625, -42.1650390625, -39.814453125, -37.4638671875, -35.11328125, -32.7626953125, -30.412109375, -28.0615234375, -25.7109375, -23.3603515625, -21.009765625, -18.6591796875, -16.30859375, -13.9580078125, -11.607421875, -9.2568359375, -6.90625, -4.5556640625, -2.205078125, 0.1455078125, 2.49609375, 4.8466796875, 7.197265625, 9.5478515625, 11.8984375, 14.2490234375, 16.599609375, 18.9501953125, 21.30078125, 23.6513671875, 26.001953125, 28.3525390625, 30.703125, 33.0537109375, 35.404296875, 37.7548828125, 40.10546875, 42.4560546875, 44.806640625, 47.1572265625, 49.5078125, 51.8583984375, 54.208984375, 56.5595703125, 58.91015625, 61.2607421875, 63.611328125, 65.9619140625, 68.3125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 4.0, 3.0, 10.0, 12.0, 24.0, 28.0, 29.0, 54.0, 68.0, 81.0, 117.0, 156.0, 257.0, 353.0, 572.0, 827.0, 1236.0, 1824.0, 2951.0, 4760.0, 8031.0, 13636.0, 23941.0, 44368.0, 85429.0, 200579.0, 378101.0, 135016.0, 64049.0, 34202.0, 19000.0, 11070.0, 6624.0, 4005.0, 2421.0, 1629.0, 1002.0, 701.0, 448.0, 283.0, 201.0, 141.0, 84.0, 85.0, 49.0, 27.0, 25.0, 19.0, 13.0, 4.0, 6.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-14.4296875, -13.9371337890625, -13.444580078125, -12.9520263671875, -12.45947265625, -11.9669189453125, -11.474365234375, -10.9818115234375, -10.4892578125, -9.9967041015625, -9.504150390625, -9.0115966796875, -8.51904296875, -8.0264892578125, -7.533935546875, -7.0413818359375, -6.548828125, -6.0562744140625, -5.563720703125, -5.0711669921875, -4.57861328125, -4.0860595703125, -3.593505859375, -3.1009521484375, -2.6083984375, -2.1158447265625, -1.623291015625, -1.1307373046875, -0.63818359375, -0.1456298828125, 0.346923828125, 0.8394775390625, 1.33203125, 1.8245849609375, 2.317138671875, 2.8096923828125, 3.30224609375, 3.7947998046875, 4.287353515625, 4.7799072265625, 5.2724609375, 5.7650146484375, 6.257568359375, 6.7501220703125, 7.24267578125, 7.7352294921875, 8.227783203125, 8.7203369140625, 9.212890625, 9.7054443359375, 10.197998046875, 10.6905517578125, 11.18310546875, 11.6756591796875, 12.168212890625, 12.6607666015625, 13.1533203125, 13.6458740234375, 14.138427734375, 14.6309814453125, 15.12353515625, 15.6160888671875, 16.108642578125, 16.6011962890625, 17.09375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 5.0, 5.0, 3.0, 9.0, 11.0, 16.0, 10.0, 11.0, 18.0, 18.0, 21.0, 27.0, 17.0, 20.0, 33.0, 23.0, 32.0, 32.0, 37.0, 31.0, 37.0, 39.0, 1068.0, 34.0, 33.0, 32.0, 48.0, 19.0, 32.0, 30.0, 35.0, 31.0, 21.0, 22.0, 21.0, 24.0, 21.0, 12.0, 10.0, 18.0, 13.0, 8.0, 5.0, 5.0, 9.0, 4.0, 5.0, 4.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.4375, -33.28564453125, -32.1337890625, -30.98193359375, -29.830078125, -28.67822265625, -27.5263671875, -26.37451171875, -25.22265625, -24.07080078125, -22.9189453125, -21.76708984375, -20.615234375, -19.46337890625, -18.3115234375, -17.15966796875, -16.0078125, -14.85595703125, -13.7041015625, -12.55224609375, -11.400390625, -10.24853515625, -9.0966796875, -7.94482421875, -6.79296875, -5.64111328125, -4.4892578125, -3.33740234375, -2.185546875, -1.03369140625, 0.1181640625, 1.27001953125, 2.421875, 3.57373046875, 4.7255859375, 5.87744140625, 7.029296875, 8.18115234375, 9.3330078125, 10.48486328125, 11.63671875, 12.78857421875, 13.9404296875, 15.09228515625, 16.244140625, 17.39599609375, 18.5478515625, 19.69970703125, 20.8515625, 22.00341796875, 23.1552734375, 24.30712890625, 25.458984375, 26.61083984375, 27.7626953125, 28.91455078125, 30.06640625, 31.21826171875, 32.3701171875, 33.52197265625, 34.673828125, 35.82568359375, 36.9775390625, 38.12939453125, 39.28125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 4.0, 4.0, 6.0, 3.0, 8.0, 7.0, 5.0, 11.0, 11.0, 21.0, 25.0, 44.0, 78.0, 130.0, 247.0, 443.0, 735.0, 1307.0, 2374.0, 4054.0, 7525.0, 13612.0, 24912.0, 46908.0, 94885.0, 261640.0, 1405847.0, 114009.0, 54509.0, 28583.0, 15585.0, 8632.0, 4749.0, 2627.0, 1538.0, 842.0, 502.0, 286.0, 174.0, 86.0, 53.0, 26.0, 25.0, 15.0, 14.0, 9.0, 4.0, 6.0, 4.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 2.0], "bins": [-19.046875, -18.488525390625, -17.93017578125, -17.371826171875, -16.8134765625, -16.255126953125, -15.69677734375, -15.138427734375, -14.580078125, -14.021728515625, -13.46337890625, -12.905029296875, -12.3466796875, -11.788330078125, -11.22998046875, -10.671630859375, -10.11328125, -9.554931640625, -8.99658203125, -8.438232421875, -7.8798828125, -7.321533203125, -6.76318359375, -6.204833984375, -5.646484375, -5.088134765625, -4.52978515625, -3.971435546875, -3.4130859375, -2.854736328125, -2.29638671875, -1.738037109375, -1.1796875, -0.621337890625, -0.06298828125, 0.495361328125, 1.0537109375, 1.612060546875, 2.17041015625, 2.728759765625, 3.287109375, 3.845458984375, 4.40380859375, 4.962158203125, 5.5205078125, 6.078857421875, 6.63720703125, 7.195556640625, 7.75390625, 8.312255859375, 8.87060546875, 9.428955078125, 9.9873046875, 10.545654296875, 11.10400390625, 11.662353515625, 12.220703125, 12.779052734375, 13.33740234375, 13.895751953125, 14.4541015625, 15.012451171875, 15.57080078125, 16.129150390625, 16.6875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 5.0, 8.0, 8.0, 6.0, 10.0, 18.0, 15.0, 22.0, 27.0, 33.0, 46.0, 53.0, 64.0, 77.0, 83.0, 79.0, 79.0, 64.0, 63.0, 62.0, 31.0, 23.0, 16.0, 19.0, 11.0, 9.0, 14.0, 11.0, 6.0, 17.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0080413818359375, -0.007733821868896484, -0.007426261901855469, -0.007118701934814453, -0.0068111419677734375, -0.006503582000732422, -0.006196022033691406, -0.005888462066650391, -0.005580902099609375, -0.005273342132568359, -0.004965782165527344, -0.004658222198486328, -0.0043506622314453125, -0.004043102264404297, -0.0037355422973632812, -0.0034279823303222656, -0.00312042236328125, -0.0028128623962402344, -0.0025053024291992188, -0.002197742462158203, -0.0018901824951171875, -0.0015826225280761719, -0.0012750625610351562, -0.0009675025939941406, -0.000659942626953125, -0.0003523826599121094, -4.482269287109375e-05, 0.0002627372741699219, 0.0005702972412109375, 0.0008778572082519531, 0.0011854171752929688, 0.0014929771423339844, 0.001800537109375, 0.0021080970764160156, 0.0024156570434570312, 0.002723217010498047, 0.0030307769775390625, 0.003338336944580078, 0.0036458969116210938, 0.003953456878662109, 0.004261016845703125, 0.004568576812744141, 0.004876136779785156, 0.005183696746826172, 0.0054912567138671875, 0.005798816680908203, 0.006106376647949219, 0.006413936614990234, 0.00672149658203125, 0.007029056549072266, 0.007336616516113281, 0.007644176483154297, 0.007951736450195312, 0.008259296417236328, 0.008566856384277344, 0.00887441635131836, 0.009181976318359375, 0.00948953628540039, 0.009797096252441406, 0.010104656219482422, 0.010412216186523438, 0.010719776153564453, 0.011027336120605469, 0.011334896087646484, 0.0116424560546875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 3.0, 5.0, 11.0, 16.0, 21.0, 9.0, 25.0, 32.0, 43.0, 61.0, 81.0, 119.0, 151.0, 230.0, 370.0, 702.0, 1691.0, 5710.0, 26035.0, 159156.0, 631904.0, 182850.0, 29095.0, 6405.0, 1856.0, 738.0, 399.0, 237.0, 152.0, 113.0, 59.0, 61.0, 48.0, 38.0, 28.0, 14.0, 20.0, 17.0, 12.0, 16.0, 4.0, 6.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07611083984375, -0.07377147674560547, -0.07143211364746094, -0.0690927505493164, -0.06675338745117188, -0.06441402435302734, -0.06207466125488281, -0.05973529815673828, -0.05739593505859375, -0.05505657196044922, -0.05271720886230469, -0.050377845764160156, -0.048038482666015625, -0.045699119567871094, -0.04335975646972656, -0.04102039337158203, -0.0386810302734375, -0.03634166717529297, -0.03400230407714844, -0.031662940979003906, -0.029323577880859375, -0.026984214782714844, -0.024644851684570312, -0.02230548858642578, -0.01996612548828125, -0.01762676239013672, -0.015287399291992188, -0.012948036193847656, -0.010608673095703125, -0.008269309997558594, -0.0059299468994140625, -0.0035905838012695312, -0.001251220703125, 0.0010881423950195312, 0.0034275054931640625, 0.005766868591308594, 0.008106231689453125, 0.010445594787597656, 0.012784957885742188, 0.015124320983886719, 0.01746368408203125, 0.01980304718017578, 0.022142410278320312, 0.024481773376464844, 0.026821136474609375, 0.029160499572753906, 0.03149986267089844, 0.03383922576904297, 0.0361785888671875, 0.03851795196533203, 0.04085731506347656, 0.043196678161621094, 0.045536041259765625, 0.047875404357910156, 0.05021476745605469, 0.05255413055419922, 0.05489349365234375, 0.05723285675048828, 0.05957221984863281, 0.061911582946777344, 0.06425094604492188, 0.0665903091430664, 0.06892967224121094, 0.07126903533935547, 0.0736083984375]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 10.0, 11.0, 22.0, 44.0, 80.0, 131.0, 170.0, 178.0, 152.0, 103.0, 58.0, 29.0, 6.0, 9.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.026106001809239388, -0.02561596967279911, -0.025125939399003983, -0.024635907262563705, -0.024145876988768578, -0.0236558448523283, -0.023165814578533173, -0.022675782442092896, -0.02218575030565262, -0.02169571816921234, -0.021205687895417213, -0.020715655758976936, -0.02022562548518181, -0.01973559334874153, -0.019245563074946404, -0.018755530938506126, -0.018265500664711, -0.01777546852827072, -0.017285438254475594, -0.016795406118035316, -0.01630537584424019, -0.01581534370779991, -0.015325312502682209, -0.014835281297564507, -0.014345250092446804, -0.013855218887329102, -0.013365187682211399, -0.012875156477093697, -0.01238512434065342, -0.011895094066858292, -0.011405061930418015, -0.010915030725300312, -0.01042499952018261, -0.009934968315064907, -0.009444937109947205, -0.008954905904829502, -0.0084648746997118, -0.007974842563271523, -0.00748481135815382, -0.0069947801530361176, -0.006504748947918415, -0.006014717742800713, -0.00552468653768301, -0.00503465486690402, -0.004544623661786318, -0.004054592456668615, -0.003564561018720269, -0.003074529580771923, -0.0025844983756542206, -0.002094467170536518, -0.001604435732588172, -0.0011144044110551476, -0.0006243730895221233, -0.00013434188440442085, 0.0003556895535439253, 0.0008457209914922714, 0.001335752196609974, 0.0018257835181429982, 0.0023158148396760225, 0.0028058462776243687, 0.003295877482742071, 0.0037859086878597736, 0.004275940358638763, 0.004765971563756466, 0.005256002768874168]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 2.0, 2.0, 4.0, 6.0, 9.0, 9.0, 8.0, 17.0, 10.0, 16.0, 14.0, 12.0, 11.0, 17.0, 26.0, 23.0, 31.0, 21.0, 32.0, 49.0, 34.0, 32.0, 32.0, 40.0, 38.0, 33.0, 37.0, 33.0, 30.0, 40.0, 41.0, 31.0, 26.0, 32.0, 28.0, 24.0, 22.0, 17.0, 23.0, 12.0, 11.0, 10.0, 17.0, 8.0, 9.0, 4.0, 7.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.004090428352355957, -0.003963497467339039, -0.0038365665823221207, -0.0037096356973052025, -0.0035827048122882843, -0.003455773927271366, -0.003328843042254448, -0.0032019121572375298, -0.0030749812722206116, -0.0029480503872036934, -0.002821119502186775, -0.002694188617169857, -0.002567257732152939, -0.0024403268471360207, -0.0023133959621191025, -0.0021864650771021843, -0.002059534192085266, -0.001932603307068348, -0.0018056724220514297, -0.0016787415370345116, -0.0015518106520175934, -0.0014248797670006752, -0.001297948881983757, -0.0011710179969668388, -0.0010440871119499207, -0.0009171562269330025, -0.0007902253419160843, -0.0006632944568991661, -0.0005363635718822479, -0.00040943268686532974, -0.00028250180184841156, -0.00015557091683149338, -2.8640031814575195e-05, 9.829085320234299e-05, 0.00022522173821926117, 0.00035215262323617935, 0.00047908350825309753, 0.0006060143932700157, 0.0007329452782869339, 0.0008598761633038521, 0.0009868070483207703, 0.0011137379333376884, 0.0012406688183546066, 0.0013675997033715248, 0.001494530588388443, 0.0016214614734053612, 0.0017483923584222794, 0.0018753232434391975, 0.0020022541284561157, 0.002129185013473034, 0.002256115898489952, 0.0023830467835068703, 0.0025099776685237885, 0.0026369085535407066, 0.002763839438557625, 0.002890770323574543, 0.003017701208591461, 0.0031446320936083794, 0.0032715629786252975, 0.0033984938636422157, 0.003525424748659134, 0.003652355633676052, 0.0037792865186929703, 0.0039062174037098885, 0.004033148288726807]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 2.0, 7.0, 5.0, 6.0, 8.0, 13.0, 4.0, 6.0, 15.0, 21.0, 26.0, 27.0, 28.0, 31.0, 49.0, 47.0, 49.0, 54.0, 49.0, 55.0, 53.0, 54.0, 49.0, 37.0, 33.0, 34.0, 25.0, 35.0, 41.0, 31.0, 15.0, 24.0, 14.0, 11.0, 9.0, 9.0, 6.0, 7.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.125, -79.7744140625, -77.423828125, -75.0732421875, -72.72265625, -70.3720703125, -68.021484375, -65.6708984375, -63.3203125, -60.9697265625, -58.619140625, -56.2685546875, -53.91796875, -51.5673828125, -49.216796875, -46.8662109375, -44.515625, -42.1650390625, -39.814453125, -37.4638671875, -35.11328125, -32.7626953125, -30.412109375, -28.0615234375, -25.7109375, -23.3603515625, -21.009765625, -18.6591796875, -16.30859375, -13.9580078125, -11.607421875, -9.2568359375, -6.90625, -4.5556640625, -2.205078125, 0.1455078125, 2.49609375, 4.8466796875, 7.197265625, 9.5478515625, 11.8984375, 14.2490234375, 16.599609375, 18.9501953125, 21.30078125, 23.6513671875, 26.001953125, 28.3525390625, 30.703125, 33.0537109375, 35.404296875, 37.7548828125, 40.10546875, 42.4560546875, 44.806640625, 47.1572265625, 49.5078125, 51.8583984375, 54.208984375, 56.5595703125, 58.91015625, 61.2607421875, 63.611328125, 65.9619140625, 68.3125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 1.0, 4.0, 3.0, 3.0, 7.0, 10.0, 8.0, 24.0, 20.0, 33.0, 49.0, 74.0, 115.0, 146.0, 279.0, 600.0, 1133.0, 2467.0, 6135.0, 20896.0, 145084.0, 716042.0, 125757.0, 19017.0, 5829.0, 2297.0, 1087.0, 570.0, 333.0, 176.0, 132.0, 67.0, 42.0, 32.0, 37.0, 15.0, 13.0, 4.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.546875, -26.770263671875, -25.99365234375, -25.217041015625, -24.4404296875, -23.663818359375, -22.88720703125, -22.110595703125, -21.333984375, -20.557373046875, -19.78076171875, -19.004150390625, -18.2275390625, -17.450927734375, -16.67431640625, -15.897705078125, -15.12109375, -14.344482421875, -13.56787109375, -12.791259765625, -12.0146484375, -11.238037109375, -10.46142578125, -9.684814453125, -8.908203125, -8.131591796875, -7.35498046875, -6.578369140625, -5.8017578125, -5.025146484375, -4.24853515625, -3.471923828125, -2.6953125, -1.918701171875, -1.14208984375, -0.365478515625, 0.4111328125, 1.187744140625, 1.96435546875, 2.740966796875, 3.517578125, 4.294189453125, 5.07080078125, 5.847412109375, 6.6240234375, 7.400634765625, 8.17724609375, 8.953857421875, 9.73046875, 10.507080078125, 11.28369140625, 12.060302734375, 12.8369140625, 13.613525390625, 14.39013671875, 15.166748046875, 15.943359375, 16.719970703125, 17.49658203125, 18.273193359375, 19.0498046875, 19.826416015625, 20.60302734375, 21.379638671875, 22.15625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 10.0, 8.0, 10.0, 17.0, 21.0, 20.0, 35.0, 41.0, 52.0, 48.0, 54.0, 69.0, 66.0, 2090.0, 81.0, 52.0, 68.0, 52.0, 51.0, 43.0, 31.0, 40.0, 23.0, 21.0, 13.0, 12.0, 5.0, 2.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-116.25, -112.04296875, -107.8359375, -103.62890625, -99.421875, -95.21484375, -91.0078125, -86.80078125, -82.59375, -78.38671875, -74.1796875, -69.97265625, -65.765625, -61.55859375, -57.3515625, -53.14453125, -48.9375, -44.73046875, -40.5234375, -36.31640625, -32.109375, -27.90234375, -23.6953125, -19.48828125, -15.28125, -11.07421875, -6.8671875, -2.66015625, 1.546875, 5.75390625, 9.9609375, 14.16796875, 18.375, 22.58203125, 26.7890625, 30.99609375, 35.203125, 39.41015625, 43.6171875, 47.82421875, 52.03125, 56.23828125, 60.4453125, 64.65234375, 68.859375, 73.06640625, 77.2734375, 81.48046875, 85.6875, 89.89453125, 94.1015625, 98.30859375, 102.515625, 106.72265625, 110.9296875, 115.13671875, 119.34375, 123.55078125, 127.7578125, 131.96484375, 136.171875, 140.37890625, 144.5859375, 148.79296875, 153.0]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 7.0, 12.0, 8.0, 17.0, 17.0, 22.0, 53.0, 60.0, 97.0, 121.0, 186.0, 305.0, 546.0, 1053.0, 3088.0, 20986.0, 845267.0, 2245909.0, 22100.0, 3306.0, 1090.0, 523.0, 284.0, 198.0, 113.0, 113.0, 66.0, 47.0, 32.0, 19.0, 17.0, 11.0, 5.0, 7.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.03125, -34.001220703125, -32.97119140625, -31.941162109375, -30.9111328125, -29.881103515625, -28.85107421875, -27.821044921875, -26.791015625, -25.760986328125, -24.73095703125, -23.700927734375, -22.6708984375, -21.640869140625, -20.61083984375, -19.580810546875, -18.55078125, -17.520751953125, -16.49072265625, -15.460693359375, -14.4306640625, -13.400634765625, -12.37060546875, -11.340576171875, -10.310546875, -9.280517578125, -8.25048828125, -7.220458984375, -6.1904296875, -5.160400390625, -4.13037109375, -3.100341796875, -2.0703125, -1.040283203125, -0.01025390625, 1.019775390625, 2.0498046875, 3.079833984375, 4.10986328125, 5.139892578125, 6.169921875, 7.199951171875, 8.22998046875, 9.260009765625, 10.2900390625, 11.320068359375, 12.35009765625, 13.380126953125, 14.41015625, 15.440185546875, 16.47021484375, 17.500244140625, 18.5302734375, 19.560302734375, 20.59033203125, 21.620361328125, 22.650390625, 23.680419921875, 24.71044921875, 25.740478515625, 26.7705078125, 27.800537109375, 28.83056640625, 29.860595703125, 30.890625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 8.0, 5.0, 23.0, 51.0, 202.0, 445.0, 198.0, 49.0, 13.0, 10.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-159.1924285888672, -144.02651977539062, -128.86062622070312, -113.69471740722656, -98.52880859375, -83.36289978027344, -68.1969985961914, -53.031097412109375, -37.86518859863281, -22.699283599853516, -7.533378601074219, 7.632526397705078, 22.798431396484375, 37.96434020996094, 53.13024139404297, 68.296142578125, 83.46205139160156, 98.62796020507812, 113.79386138916016, 128.9597625732422, 144.12567138671875, 159.2915802001953, 174.45748901367188, 189.62338256835938, 204.78929138183594, 219.9552001953125, 235.12109375, 250.28700256347656, 265.4529113769531, 280.61883544921875, 295.78472900390625, 310.95062255859375, 326.11651611328125, 341.28240966796875, 356.4483337402344, 371.6142272949219, 386.7801513671875, 401.946044921875, 417.1119384765625, 432.27783203125, 447.4437561035156, 462.6096496582031, 477.77557373046875, 492.94146728515625, 508.10736083984375, 523.2733154296875, 538.439208984375, 553.6051025390625, 568.77099609375, 583.9368896484375, 599.102783203125, 614.2687377929688, 629.4346313476562, 644.6005249023438, 659.7664184570312, 674.9323120117188, 690.0982666015625, 705.26416015625, 720.4300537109375, 735.5960083007812, 750.7619018554688, 765.9277954101562, 781.0936889648438, 796.2595825195312, 811.4254760742188]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 4.0, 8.0, 6.0, 13.0, 12.0, 12.0, 17.0, 25.0, 31.0, 18.0, 33.0, 41.0, 44.0, 48.0, 50.0, 52.0, 51.0, 56.0, 51.0, 45.0, 35.0, 33.0, 45.0, 36.0, 32.0, 20.0, 35.0, 32.0, 20.0, 22.0, 12.0, 15.0, 6.0, 6.0, 5.0, 2.0, 4.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.28558349609375, -120.87677001953125, -116.46795654296875, -112.05914306640625, -107.65032958984375, -103.24151611328125, -98.83270263671875, -94.42388916015625, -90.01507568359375, -85.60626220703125, -81.19744873046875, -76.78863525390625, -72.37982177734375, -67.97100830078125, -63.562191009521484, -59.153377532958984, -54.74456024169922, -50.33574676513672, -45.92693328857422, -41.51811981201172, -37.10930633544922, -32.70049285888672, -28.291675567626953, -23.882862091064453, -19.474048614501953, -15.065235137939453, -10.656420707702637, -6.24760627746582, -1.8387928009033203, 2.5700206756591797, 6.9788360595703125, 11.387649536132812, 15.796463012695312, 20.205276489257812, 24.614089965820312, 29.022905349731445, 33.43171691894531, 37.84053039550781, 42.24934768676758, 46.65816116333008, 51.06697463989258, 55.47578811645508, 59.88460159301758, 64.29341888427734, 68.70223236083984, 73.11104583740234, 77.51985931396484, 81.92867279052734, 86.33748626708984, 90.74629974365234, 95.15511322021484, 99.56392669677734, 103.97274017333984, 108.38155364990234, 112.79037475585938, 117.19918823242188, 121.60800170898438, 126.01681518554688, 130.42562866210938, 134.83444213867188, 139.24325561523438, 143.65206909179688, 148.06088256835938, 152.46969604492188, 156.87850952148438]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 4.0, 10.0, 15.0, 16.0, 36.0, 31.0, 46.0, 52.0, 81.0, 108.0, 143.0, 175.0, 205.0, 290.0, 363.0, 537.0, 633.0, 891.0, 1041230.0, 899.0, 682.0, 521.0, 358.0, 249.0, 210.0, 174.0, 136.0, 111.0, 104.0, 75.0, 45.0, 27.0, 26.0, 25.0, 10.0, 7.0, 12.0, 2.0, 3.0, 3.0, 8.0, 1.0], "bins": [-59.018165588378906, -57.561302185058594, -56.10443878173828, -54.64757537841797, -53.190711975097656, -51.733848571777344, -50.27698516845703, -48.82012176513672, -47.363258361816406, -45.906394958496094, -44.44953155517578, -42.99266815185547, -41.535804748535156, -40.078941345214844, -38.62207794189453, -37.16521453857422, -35.708351135253906, -34.251487731933594, -32.79462432861328, -31.33776092529297, -29.880897521972656, -28.424034118652344, -26.96717071533203, -25.51030731201172, -24.053443908691406, -22.596580505371094, -21.13971710205078, -19.68285369873047, -18.225990295410156, -16.769126892089844, -15.312263488769531, -13.855400085449219, -12.398536682128906, -10.941673278808594, -9.484809875488281, -8.027946472167969, -6.571083068847656, -5.114219665527344, -3.6573562622070312, -2.2004928588867188, -0.7436294555664062, 0.7132339477539062, 2.1700973510742188, 3.6269607543945312, 5.083824157714844, 6.540687561035156, 7.997550964355469, 9.454414367675781, 10.911277770996094, 12.368141174316406, 13.825004577636719, 15.281867980957031, 16.738731384277344, 18.195594787597656, 19.65245819091797, 21.10932159423828, 22.566184997558594, 24.023048400878906, 25.47991180419922, 26.93677520751953, 28.393638610839844, 29.850502014160156, 31.30736541748047, 32.76422882080078, 34.221092224121094]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 3.0, 8.0, 11.0, 10.0, 2.0, 11.0, 6.0, 10.0, 13.0, 25.0, 31.0, 72.0, 393.0, 51462036.0, 283.0, 71.0, 45.0, 22.0, 20.0, 12.0, 6.0, 5.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 5.0, 7.0, 1.0, 9.0, 4.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4100.0, -3933.07421875, -3766.1484375, -3599.22265625, -3432.296875, -3265.37109375, -3098.4453125, -2931.51953125, -2764.59375, -2597.66796875, -2430.7421875, -2263.81640625, -2096.890625, -1929.96484375, -1763.0391845703125, -1596.1134033203125, -1429.187744140625, -1262.261962890625, -1095.336181640625, -928.4104614257812, -761.4846801757812, -594.5588989257812, -427.6331787109375, -260.7073974609375, -93.7816162109375, 73.14414978027344, 240.06991577148438, 406.99566650390625, 573.9214477539062, 740.8472290039062, 907.77294921875, 1074.69873046875, 1241.62451171875, 1408.55029296875, 1575.47607421875, 1742.40185546875, 1909.32763671875, 2076.25341796875, 2243.17919921875, 2410.10498046875, 2577.03076171875, 2743.95654296875, 2910.88232421875, 3077.80810546875, 3244.73388671875, 3411.65966796875, 3578.58544921875, 3745.51123046875, 3912.436767578125, 4079.362548828125, 4246.2880859375, 4413.2138671875, 4580.1396484375, 4747.0654296875, 4913.9912109375, 5080.9169921875, 5247.8427734375, 5414.7685546875, 5581.6943359375, 5748.6201171875, 5915.5458984375, 6082.4716796875, 6249.3974609375, 6416.3232421875, 6583.2490234375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [9.0, 9.0, 9.0, 10.0, 12.0, 35.0, 40.0, 40.0, 53.0, 71.0, 106.0, 146.0, 219.0, 346.0, 455.0, 601.0, 837.0, 1131.0, 1616.0, 2454.0, 3518.0, 5055.0, 7029.0, 10475.0, 15143.0, 21720.0, 32045.0, 46824.0, 70832.0, 108914.0, 174532.0, 316677.0, 1165759.0, 3372199.0, 373855.0, 196041.0, 119659.0, 78579.0, 51875.0, 34980.0, 24130.0, 16110.0, 11384.0, 7697.0, 5329.0, 3846.0, 2777.0, 1804.0, 1197.0, 917.0, 670.0, 469.0, 343.0, 262.0, 179.0, 111.0, 83.0, 66.0, 45.0, 21.0, 28.0, 38.0, 27.0, 13.0], "bins": [-5.703125, -5.5308837890625, -5.358642578125, -5.1864013671875, -5.01416015625, -4.8419189453125, -4.669677734375, -4.4974365234375, -4.3251953125, -4.1529541015625, -3.980712890625, -3.8084716796875, -3.63623046875, -3.4639892578125, -3.291748046875, -3.1195068359375, -2.947265625, -2.7750244140625, -2.602783203125, -2.4305419921875, -2.25830078125, -2.0860595703125, -1.913818359375, -1.7415771484375, -1.5693359375, -1.3970947265625, -1.224853515625, -1.0526123046875, -0.88037109375, -0.7081298828125, -0.535888671875, -0.3636474609375, -0.19140625, -0.0191650390625, 0.153076171875, 0.3253173828125, 0.49755859375, 0.6697998046875, 0.842041015625, 1.0142822265625, 1.1865234375, 1.3587646484375, 1.531005859375, 1.7032470703125, 1.87548828125, 2.0477294921875, 2.219970703125, 2.3922119140625, 2.564453125, 2.7366943359375, 2.908935546875, 3.0811767578125, 3.25341796875, 3.4256591796875, 3.597900390625, 3.7701416015625, 3.9423828125, 4.1146240234375, 4.286865234375, 4.4591064453125, 4.63134765625, 4.8035888671875, 4.975830078125, 5.1480712890625, 5.3203125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [3.0, 3.0, 4.0, 0.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 7.0, 8.0, 13.0, 11.0, 15.0, 11.0, 12.0, 30.0, 18.0, 26.0, 25.0, 31.0, 22.0, 30.0, 32.0, 34.0, 51.0, 39.0, 76.0, 128.0, 521.0, 349.0, 88.0, 42.0, 43.0, 34.0, 30.0, 31.0, 27.0, 24.0, 30.0, 21.0, 20.0, 13.0, 16.0, 15.0, 14.0, 9.0, 10.0, 8.0, 3.0, 11.0, 10.0, 4.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-12.1015625, -11.71044921875, -11.3193359375, -10.92822265625, -10.537109375, -10.14599609375, -9.7548828125, -9.36376953125, -8.97265625, -8.58154296875, -8.1904296875, -7.79931640625, -7.408203125, -7.01708984375, -6.6259765625, -6.23486328125, -5.84375, -5.45263671875, -5.0615234375, -4.67041015625, -4.279296875, -3.88818359375, -3.4970703125, -3.10595703125, -2.71484375, -2.32373046875, -1.9326171875, -1.54150390625, -1.150390625, -0.75927734375, -0.3681640625, 0.02294921875, 0.4140625, 0.80517578125, 1.1962890625, 1.58740234375, 1.978515625, 2.36962890625, 2.7607421875, 3.15185546875, 3.54296875, 3.93408203125, 4.3251953125, 4.71630859375, 5.107421875, 5.49853515625, 5.8896484375, 6.28076171875, 6.671875, 7.06298828125, 7.4541015625, 7.84521484375, 8.236328125, 8.62744140625, 9.0185546875, 9.40966796875, 9.80078125, 10.19189453125, 10.5830078125, 10.97412109375, 11.365234375, 11.75634765625, 12.1474609375, 12.53857421875, 12.9296875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 7.0, 9.0, 21.0, 18.0, 13.0, 27.0, 31.0, 45.0, 61.0, 111.0, 147.0, 239.0, 315.0, 524.0, 631.0, 1079.0, 1530.0, 2379.0, 3415.0, 5499.0, 8195.0, 12839.0, 19587.0, 31023.0, 48066.0, 76392.0, 127840.0, 231376.0, 568461.0, 3984057.0, 588223.0, 235389.0, 129041.0, 78114.0, 48176.0, 31108.0, 19840.0, 13002.0, 8204.0, 5586.0, 3421.0, 2477.0, 1632.0, 1045.0, 637.0, 451.0, 385.0, 213.0, 199.0, 116.0, 79.0, 56.0, 44.0, 14.0, 17.0, 11.0, 8.0, 12.0, 7.0, 5.0, 4.0], "bins": [-6.953125, -6.7392578125, -6.525390625, -6.3115234375, -6.09765625, -5.8837890625, -5.669921875, -5.4560546875, -5.2421875, -5.0283203125, -4.814453125, -4.6005859375, -4.38671875, -4.1728515625, -3.958984375, -3.7451171875, -3.53125, -3.3173828125, -3.103515625, -2.8896484375, -2.67578125, -2.4619140625, -2.248046875, -2.0341796875, -1.8203125, -1.6064453125, -1.392578125, -1.1787109375, -0.96484375, -0.7509765625, -0.537109375, -0.3232421875, -0.109375, 0.1044921875, 0.318359375, 0.5322265625, 0.74609375, 0.9599609375, 1.173828125, 1.3876953125, 1.6015625, 1.8154296875, 2.029296875, 2.2431640625, 2.45703125, 2.6708984375, 2.884765625, 3.0986328125, 3.3125, 3.5263671875, 3.740234375, 3.9541015625, 4.16796875, 4.3818359375, 4.595703125, 4.8095703125, 5.0234375, 5.2373046875, 5.451171875, 5.6650390625, 5.87890625, 6.0927734375, 6.306640625, 6.5205078125, 6.734375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 7.0, 10.0, 4.0, 12.0, 18.0, 16.0, 15.0, 26.0, 21.0, 26.0, 29.0, 25.0, 30.0, 49.0, 35.0, 51.0, 82.0, 136.0, 434.0, 433.0, 120.0, 60.0, 41.0, 45.0, 27.0, 41.0, 38.0, 25.0, 24.0, 25.0, 30.0, 20.0, 19.0, 17.0, 7.0, 11.0, 1.0, 8.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6875, -10.34326171875, -9.9990234375, -9.65478515625, -9.310546875, -8.96630859375, -8.6220703125, -8.27783203125, -7.93359375, -7.58935546875, -7.2451171875, -6.90087890625, -6.556640625, -6.21240234375, -5.8681640625, -5.52392578125, -5.1796875, -4.83544921875, -4.4912109375, -4.14697265625, -3.802734375, -3.45849609375, -3.1142578125, -2.77001953125, -2.42578125, -2.08154296875, -1.7373046875, -1.39306640625, -1.048828125, -0.70458984375, -0.3603515625, -0.01611328125, 0.328125, 0.67236328125, 1.0166015625, 1.36083984375, 1.705078125, 2.04931640625, 2.3935546875, 2.73779296875, 3.08203125, 3.42626953125, 3.7705078125, 4.11474609375, 4.458984375, 4.80322265625, 5.1474609375, 5.49169921875, 5.8359375, 6.18017578125, 6.5244140625, 6.86865234375, 7.212890625, 7.55712890625, 7.9013671875, 8.24560546875, 8.58984375, 8.93408203125, 9.2783203125, 9.62255859375, 9.966796875, 10.31103515625, 10.6552734375, 10.99951171875, 11.34375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 11.0, 26.0, 25.0, 19.0, 37.0, 60.0, 95.0, 98.0, 125.0, 156.0, 202.0, 312.0, 429.0, 676.0, 953.0, 1474.0, 2465.0, 4298.0, 8034.0, 19268.0, 61893.0, 5863292.0, 255682.0, 41083.0, 14580.0, 6540.0, 3290.0, 2019.0, 1236.0, 929.0, 592.0, 426.0, 254.0, 252.0, 169.0, 129.0, 82.0, 41.0, 52.0, 43.0, 24.0, 16.0, 7.0, 8.0, 8.0, 5.0, 8.0, 2.0, 0.0, 5.0, 1.0, 6.0], "bins": [-26.3125, -25.53515625, -24.7578125, -23.98046875, -23.203125, -22.42578125, -21.6484375, -20.87109375, -20.09375, -19.31640625, -18.5390625, -17.76171875, -16.984375, -16.20703125, -15.4296875, -14.65234375, -13.875, -13.09765625, -12.3203125, -11.54296875, -10.765625, -9.98828125, -9.2109375, -8.43359375, -7.65625, -6.87890625, -6.1015625, -5.32421875, -4.546875, -3.76953125, -2.9921875, -2.21484375, -1.4375, -0.66015625, 0.1171875, 0.89453125, 1.671875, 2.44921875, 3.2265625, 4.00390625, 4.78125, 5.55859375, 6.3359375, 7.11328125, 7.890625, 8.66796875, 9.4453125, 10.22265625, 11.0, 11.77734375, 12.5546875, 13.33203125, 14.109375, 14.88671875, 15.6640625, 16.44140625, 17.21875, 17.99609375, 18.7734375, 19.55078125, 20.328125, 21.10546875, 21.8828125, 22.66015625, 23.4375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 8.0, 12.0, 12.0, 16.0, 17.0, 13.0, 21.0, 17.0, 33.0, 30.0, 41.0, 33.0, 33.0, 60.0, 61.0, 87.0, 160.0, 417.0, 377.0, 137.0, 66.0, 52.0, 58.0, 37.0, 43.0, 38.0, 20.0, 24.0, 20.0, 12.0, 13.0, 11.0, 8.0, 8.0, 5.0, 5.0, 8.0, 5.0, 3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-9.234375, -8.977783203125, -8.72119140625, -8.464599609375, -8.2080078125, -7.951416015625, -7.69482421875, -7.438232421875, -7.181640625, -6.925048828125, -6.66845703125, -6.411865234375, -6.1552734375, -5.898681640625, -5.64208984375, -5.385498046875, -5.12890625, -4.872314453125, -4.61572265625, -4.359130859375, -4.1025390625, -3.845947265625, -3.58935546875, -3.332763671875, -3.076171875, -2.819580078125, -2.56298828125, -2.306396484375, -2.0498046875, -1.793212890625, -1.53662109375, -1.280029296875, -1.0234375, -0.766845703125, -0.51025390625, -0.253662109375, 0.0029296875, 0.259521484375, 0.51611328125, 0.772705078125, 1.029296875, 1.285888671875, 1.54248046875, 1.799072265625, 2.0556640625, 2.312255859375, 2.56884765625, 2.825439453125, 3.08203125, 3.338623046875, 3.59521484375, 3.851806640625, 4.1083984375, 4.364990234375, 4.62158203125, 4.878173828125, 5.134765625, 5.391357421875, 5.64794921875, 5.904541015625, 6.1611328125, 6.417724609375, 6.67431640625, 6.930908203125, 7.1875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 5.0, 4.0, 1.0, 6.0, 8.0, 13.0, 32.0, 62.0, 123.0, 380.0, 206.0, 80.0, 42.0, 22.0, 8.0, 8.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-55.1705322265625, -54.083412170410156, -52.99629592895508, -51.909175872802734, -50.82205581665039, -49.73493576049805, -48.64781951904297, -47.560699462890625, -46.47357940673828, -45.38645935058594, -44.29934310913086, -43.212223052978516, -42.12510299682617, -41.03798294067383, -39.95086669921875, -38.863746643066406, -37.77662658691406, -36.68950653076172, -35.60239028930664, -34.5152702331543, -33.42815017700195, -32.34103012084961, -31.25391387939453, -30.166793823242188, -29.07967758178711, -27.9925594329834, -26.905439376831055, -25.818321228027344, -24.731201171875, -23.64408302307129, -22.556964874267578, -21.469844818115234, -20.382726669311523, -19.295608520507812, -18.20848846435547, -17.121370315551758, -16.034250259399414, -14.947132110595703, -13.860013008117676, -12.772893905639648, -11.685774803161621, -10.598655700683594, -9.511536598205566, -8.424417495727539, -7.33729887008667, -6.250179767608643, -5.163061141967773, -4.075942039489746, -2.9888229370117188, -1.901703953742981, -0.8145849704742432, 0.2725338935852051, 1.3596529960632324, 2.4467720985412598, 3.533890724182129, 4.621009826660156, 5.708128929138184, 6.795248031616211, 7.882367134094238, 8.969486236572266, 10.056604385375977, 11.14372444152832, 12.230842590332031, 13.317961692810059, 14.405080795288086]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 2.0, 7.0, 11.0, 11.0, 11.0, 14.0, 18.0, 19.0, 21.0, 27.0, 25.0, 34.0, 34.0, 41.0, 33.0, 35.0, 47.0, 35.0, 40.0, 43.0, 55.0, 50.0, 45.0, 39.0, 34.0, 26.0, 36.0, 34.0, 29.0, 17.0, 17.0, 20.0, 10.0, 19.0, 16.0, 13.0, 5.0, 3.0, 4.0, 3.0, 5.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.46691608428955, -10.115336418151855, -9.763757705688477, -9.412178039550781, -9.060599327087402, -8.709019660949707, -8.357440948486328, -8.005861282348633, -7.654282093048096, -7.302702903747559, -6.9511237144470215, -6.599544525146484, -6.247964859008789, -5.89638614654541, -5.544806480407715, -5.193227291107178, -4.841648101806641, -4.4900689125061035, -4.138489723205566, -3.78691029548645, -3.435331106185913, -3.083751916885376, -2.7321724891662598, -2.3805932998657227, -2.0290141105651855, -1.6774349212646484, -1.3258556127548218, -0.9742763042449951, -0.622697114944458, -0.2711179256439209, 0.08046150207519531, 0.4320406913757324, 0.7836189270019531, 1.1351981163024902, 1.486777424812317, 1.8383567333221436, 2.1899359226226807, 2.5415151119232178, 2.893094539642334, 3.244673728942871, 3.596252918243408, 3.9478321075439453, 4.299411296844482, 4.6509904861450195, 5.002570152282715, 5.354148864746094, 5.705728530883789, 6.057307720184326, 6.408886909484863, 6.7604660987854, 7.1120452880859375, 7.463624954223633, 7.815203666687012, 8.166783332824707, 8.518362045288086, 8.869941711425781, 9.221521377563477, 9.573101043701172, 9.92467975616455, 10.276259422302246, 10.627838134765625, 10.97941780090332, 11.330997467041016, 11.682576179504395, 12.034154891967773]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 7.0, 7.0, 6.0, 13.0, 20.0, 20.0, 28.0, 30.0, 40.0, 55.0, 62.0, 127.0, 147.0, 255.0, 287.0, 494.0, 675.0, 1180.0, 1879.0, 3148.0, 5614.0, 11539.0, 27555.0, 120627.0, 3911227.0, 66885.0, 21137.0, 9313.0, 4711.0, 2649.0, 1547.0, 1001.0, 617.0, 415.0, 250.0, 174.0, 150.0, 96.0, 82.0, 53.0, 33.0, 40.0, 21.0, 16.0, 11.0, 12.0, 8.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0], "bins": [-0.0309906005859375, -0.030060529708862305, -0.02913045883178711, -0.028200387954711914, -0.02727031707763672, -0.026340246200561523, -0.025410175323486328, -0.024480104446411133, -0.023550033569335938, -0.022619962692260742, -0.021689891815185547, -0.02075982093811035, -0.019829750061035156, -0.01889967918395996, -0.017969608306884766, -0.01703953742980957, -0.016109466552734375, -0.01517939567565918, -0.014249324798583984, -0.013319253921508789, -0.012389183044433594, -0.011459112167358398, -0.010529041290283203, -0.009598970413208008, -0.008668899536132812, -0.007738828659057617, -0.006808757781982422, -0.0058786869049072266, -0.004948616027832031, -0.004018545150756836, -0.0030884742736816406, -0.0021584033966064453, -0.00122833251953125, -0.0002982616424560547, 0.0006318092346191406, 0.001561880111694336, 0.0024919509887695312, 0.0034220218658447266, 0.004352092742919922, 0.005282163619995117, 0.0062122344970703125, 0.007142305374145508, 0.008072376251220703, 0.009002447128295898, 0.009932518005371094, 0.010862588882446289, 0.011792659759521484, 0.01272273063659668, 0.013652801513671875, 0.01458287239074707, 0.015512943267822266, 0.01644301414489746, 0.017373085021972656, 0.01830315589904785, 0.019233226776123047, 0.020163297653198242, 0.021093368530273438, 0.022023439407348633, 0.022953510284423828, 0.023883581161499023, 0.02481365203857422, 0.025743722915649414, 0.02667379379272461, 0.027603864669799805, 0.028533935546875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 8.0, 7.0, 13.0, 11.0, 12.0, 20.0, 328.0, 473.0, 18.0, 14.0, 20.0, 6.0, 6.0, 8.0, 9.0, 5.0, 6.0, 6.0, 3.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0047454833984375, -0.004606425762176514, -0.004467368125915527, -0.004328310489654541, -0.004189252853393555, -0.004050195217132568, -0.003911137580871582, -0.0037720799446105957, -0.0036330223083496094, -0.003493964672088623, -0.0033549070358276367, -0.0032158493995666504, -0.003076791763305664, -0.0029377341270446777, -0.0027986764907836914, -0.002659618854522705, -0.0025205612182617188, -0.0023815035820007324, -0.002242445945739746, -0.0021033883094787598, -0.0019643306732177734, -0.0018252730369567871, -0.0016862154006958008, -0.0015471577644348145, -0.0014081001281738281, -0.0012690424919128418, -0.0011299848556518555, -0.0009909272193908691, -0.0008518695831298828, -0.0007128119468688965, -0.0005737543106079102, -0.00043469667434692383, -0.0002956390380859375, -0.00015658140182495117, -1.7523765563964844e-05, 0.00012153387069702148, 0.0002605915069580078, 0.00039964914321899414, 0.0005387067794799805, 0.0006777644157409668, 0.0008168220520019531, 0.0009558796882629395, 0.0010949373245239258, 0.0012339949607849121, 0.0013730525970458984, 0.0015121102333068848, 0.001651167869567871, 0.0017902255058288574, 0.0019292831420898438, 0.00206834077835083, 0.0022073984146118164, 0.0023464560508728027, 0.002485513687133789, 0.0026245713233947754, 0.0027636289596557617, 0.002902686595916748, 0.0030417442321777344, 0.0031808018684387207, 0.003319859504699707, 0.0034589171409606934, 0.0035979747772216797, 0.003737032413482666, 0.0038760900497436523, 0.004015147686004639, 0.004154205322265625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 7.0, 5.0, 26.0, 13.0, 23.0, 29.0, 41.0, 60.0, 122.0, 135.0, 199.0, 381.0, 635.0, 1137.0, 2473.0, 5750.0, 17211.0, 70687.0, 597681.0, 3269658.0, 178135.0, 33029.0, 9607.0, 3564.0, 1619.0, 785.0, 502.0, 239.0, 151.0, 89.0, 91.0, 56.0, 46.0, 29.0, 21.0, 13.0, 14.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03668212890625, -0.03546953201293945, -0.034256935119628906, -0.03304433822631836, -0.03183174133300781, -0.030619144439697266, -0.02940654754638672, -0.028193950653076172, -0.026981353759765625, -0.025768756866455078, -0.02455615997314453, -0.023343563079833984, -0.022130966186523438, -0.02091836929321289, -0.019705772399902344, -0.018493175506591797, -0.01728057861328125, -0.016067981719970703, -0.014855384826660156, -0.01364278793334961, -0.012430191040039062, -0.011217594146728516, -0.010004997253417969, -0.008792400360107422, -0.007579803466796875, -0.006367206573486328, -0.005154609680175781, -0.003942012786865234, -0.0027294158935546875, -0.0015168190002441406, -0.00030422210693359375, 0.0009083747863769531, 0.0021209716796875, 0.003333568572998047, 0.004546165466308594, 0.005758762359619141, 0.0069713592529296875, 0.008183956146240234, 0.009396553039550781, 0.010609149932861328, 0.011821746826171875, 0.013034343719482422, 0.014246940612792969, 0.015459537506103516, 0.016672134399414062, 0.01788473129272461, 0.019097328186035156, 0.020309925079345703, 0.02152252197265625, 0.022735118865966797, 0.023947715759277344, 0.02516031265258789, 0.026372909545898438, 0.027585506439208984, 0.02879810333251953, 0.030010700225830078, 0.031223297119140625, 0.03243589401245117, 0.03364849090576172, 0.034861087799072266, 0.03607368469238281, 0.03728628158569336, 0.038498878479003906, 0.03971147537231445, 0.040924072265625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 1.0, 1.0, 4.0, 4.0, 6.0, 5.0, 14.0, 9.0, 9.0, 14.0, 23.0, 32.0, 40.0, 64.0, 46.0, 61.0, 97.0, 108.0, 121.0, 180.0, 271.0, 470.0, 993.0, 421.0, 237.0, 170.0, 146.0, 83.0, 86.0, 74.0, 52.0, 44.0, 40.0, 28.0, 21.0, 20.0, 16.0, 22.0, 13.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 5.0], "bins": [-0.0069122314453125, -0.006727397441864014, -0.006542563438415527, -0.006357729434967041, -0.006172895431518555, -0.005988061428070068, -0.005803227424621582, -0.005618393421173096, -0.005433559417724609, -0.005248725414276123, -0.005063891410827637, -0.00487905740737915, -0.004694223403930664, -0.004509389400482178, -0.004324555397033691, -0.004139721393585205, -0.003954887390136719, -0.0037700533866882324, -0.003585219383239746, -0.0034003853797912598, -0.0032155513763427734, -0.003030717372894287, -0.0028458833694458008, -0.0026610493659973145, -0.002476215362548828, -0.002291381359100342, -0.0021065473556518555, -0.0019217133522033691, -0.0017368793487548828, -0.0015520453453063965, -0.0013672113418579102, -0.0011823773384094238, -0.0009975433349609375, -0.0008127093315124512, -0.0006278753280639648, -0.0004430413246154785, -0.0002582073211669922, -7.337331771850586e-05, 0.00011146068572998047, 0.0002962946891784668, 0.0004811286926269531, 0.0006659626960754395, 0.0008507966995239258, 0.0010356307029724121, 0.0012204647064208984, 0.0014052987098693848, 0.001590132713317871, 0.0017749667167663574, 0.0019598007202148438, 0.00214463472366333, 0.0023294687271118164, 0.0025143027305603027, 0.002699136734008789, 0.0028839707374572754, 0.0030688047409057617, 0.003253638744354248, 0.0034384727478027344, 0.0036233067512512207, 0.003808140754699707, 0.003992974758148193, 0.00417780876159668, 0.004362642765045166, 0.004547476768493652, 0.004732310771942139, 0.004917144775390625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 12.0, 19.0, 92.0, 302.0, 371.0, 131.0, 46.0, 14.0, 10.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.24027228355407715, -0.23506303131580353, -0.2298537790775299, -0.2246445268392563, -0.21943527460098267, -0.21422600746154785, -0.20901675522327423, -0.2038075029850006, -0.198598250746727, -0.19338899850845337, -0.18817974627017975, -0.18297049403190613, -0.1777612268924713, -0.1725519746541977, -0.16734272241592407, -0.16213347017765045, -0.15692421793937683, -0.1517149657011032, -0.1465057134628296, -0.14129646122455597, -0.13608720898628235, -0.13087794184684753, -0.1256686896085739, -0.12045943737030029, -0.11525018513202667, -0.11004093289375305, -0.10483168065547943, -0.09962242096662521, -0.09441316872835159, -0.08920391649007797, -0.08399465680122375, -0.07878540456295013, -0.07357613742351532, -0.0683668851852417, -0.06315763294696808, -0.05794837325811386, -0.05273912101984024, -0.04752986878156662, -0.0423206128180027, -0.03711135685443878, -0.03190210461616516, -0.02669285051524639, -0.02148359641432762, -0.01627434231340885, -0.011065088212490082, -0.005855834111571312, -0.0006465800106525421, 0.004562675952911377, 0.009771928191184998, 0.014981182292103767, 0.020190436393022537, 0.025399690493941307, 0.030608944594860077, 0.0358181968331337, 0.04102745279669762, 0.046236708760261536, 0.051445960998535156, 0.05665521323680878, 0.061864469200372696, 0.06707372516393661, 0.07228297740221024, 0.07749222964048386, 0.08270148932933807, 0.0879107415676117, 0.09311999380588531]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 4.0, 5.0, 6.0, 12.0, 16.0, 13.0, 17.0, 18.0, 19.0, 21.0, 31.0, 29.0, 44.0, 42.0, 45.0, 50.0, 51.0, 52.0, 59.0, 49.0, 52.0, 56.0, 35.0, 51.0, 29.0, 34.0, 28.0, 23.0, 22.0, 18.0, 20.0, 12.0, 12.0, 6.0, 3.0, 5.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.038920819759368896, -0.037841327488422394, -0.03676183521747589, -0.03568234294652939, -0.034602850675582886, -0.03352335840463638, -0.03244386613368988, -0.03136437386274338, -0.030284881591796875, -0.029205389320850372, -0.02812589704990387, -0.027046404778957367, -0.025966912508010864, -0.02488742023706436, -0.02380792796611786, -0.022728435695171356, -0.021648943424224854, -0.02056945115327835, -0.019489958882331848, -0.018410466611385345, -0.017330974340438843, -0.01625148206949234, -0.015171989798545837, -0.014092497527599335, -0.013013005256652832, -0.01193351298570633, -0.010854020714759827, -0.009774528443813324, -0.008695036172866821, -0.007615543901920319, -0.006536051630973816, -0.005456559360027313, -0.0043770670890808105, -0.003297574818134308, -0.002218082547187805, -0.0011385902762413025, -5.9098005294799805e-05, 0.0010203942656517029, 0.0020998865365982056, 0.0031793788075447083, 0.004258871078491211, 0.005338363349437714, 0.006417855620384216, 0.007497347891330719, 0.008576840162277222, 0.009656332433223724, 0.010735824704170227, 0.01181531697511673, 0.012894809246063232, 0.013974301517009735, 0.015053793787956238, 0.01613328605890274, 0.017212778329849243, 0.018292270600795746, 0.01937176287174225, 0.02045125514268875, 0.021530747413635254, 0.022610239684581757, 0.02368973195552826, 0.024769224226474762, 0.025848716497421265, 0.026928208768367767, 0.02800770103931427, 0.029087193310260773, 0.030166685581207275]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 3.0, 7.0, 6.0, 14.0, 12.0, 18.0, 25.0, 38.0, 36.0, 69.0, 99.0, 157.0, 184.0, 307.0, 464.0, 728.0, 1154.0, 1971.0, 3471.0, 6378.0, 14309.0, 55079.0, 872036.0, 61522.0, 14757.0, 6721.0, 3501.0, 1991.0, 1324.0, 715.0, 474.0, 309.0, 210.0, 146.0, 95.0, 60.0, 50.0, 35.0, 22.0, 16.0, 12.0, 7.0, 6.0, 4.0, 6.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.04827880859375, -0.04679441452026367, -0.045310020446777344, -0.043825626373291016, -0.04234123229980469, -0.04085683822631836, -0.03937244415283203, -0.0378880500793457, -0.036403656005859375, -0.03491926193237305, -0.03343486785888672, -0.03195047378540039, -0.030466079711914062, -0.028981685638427734, -0.027497291564941406, -0.026012897491455078, -0.02452850341796875, -0.023044109344482422, -0.021559715270996094, -0.020075321197509766, -0.018590927124023438, -0.01710653305053711, -0.015622138977050781, -0.014137744903564453, -0.012653350830078125, -0.011168956756591797, -0.009684562683105469, -0.00820016860961914, -0.0067157745361328125, -0.005231380462646484, -0.0037469863891601562, -0.002262592315673828, -0.0007781982421875, 0.0007061958312988281, 0.0021905899047851562, 0.0036749839782714844, 0.0051593780517578125, 0.006643772125244141, 0.008128166198730469, 0.009612560272216797, 0.011096954345703125, 0.012581348419189453, 0.014065742492675781, 0.01555013656616211, 0.017034530639648438, 0.018518924713134766, 0.020003318786621094, 0.021487712860107422, 0.02297210693359375, 0.024456501007080078, 0.025940895080566406, 0.027425289154052734, 0.028909683227539062, 0.03039407730102539, 0.03187847137451172, 0.03336286544799805, 0.034847259521484375, 0.0363316535949707, 0.03781604766845703, 0.03930044174194336, 0.04078483581542969, 0.042269229888916016, 0.043753623962402344, 0.04523801803588867, 0.046722412109375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 0.0, 5.0, 4.0, 7.0, 5.0, 8.0, 5.0, 13.0, 16.0, 26.0, 74.0, 232.0, 323.0, 152.0, 44.0, 19.0, 9.0, 8.0, 13.0, 4.0, 3.0, 7.0, 2.0, 8.0, 1.0, 1.0, 1.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00499725341796875, -0.004859566688537598, -0.004721879959106445, -0.004584193229675293, -0.004446506500244141, -0.004308819770812988, -0.004171133041381836, -0.004033446311950684, -0.0038957595825195312, -0.003758072853088379, -0.0036203861236572266, -0.0034826993942260742, -0.003345012664794922, -0.0032073259353637695, -0.003069639205932617, -0.002931952476501465, -0.0027942657470703125, -0.00265657901763916, -0.002518892288208008, -0.0023812055587768555, -0.002243518829345703, -0.0021058320999145508, -0.0019681453704833984, -0.001830458641052246, -0.0016927719116210938, -0.0015550851821899414, -0.001417398452758789, -0.0012797117233276367, -0.0011420249938964844, -0.001004338264465332, -0.0008666515350341797, -0.0007289648056030273, -0.000591278076171875, -0.00045359134674072266, -0.0003159046173095703, -0.00017821788787841797, -4.0531158447265625e-05, 9.715557098388672e-05, 0.00023484230041503906, 0.0003725290298461914, 0.0005102157592773438, 0.0006479024887084961, 0.0007855892181396484, 0.0009232759475708008, 0.0010609626770019531, 0.0011986494064331055, 0.0013363361358642578, 0.0014740228652954102, 0.0016117095947265625, 0.0017493963241577148, 0.0018870830535888672, 0.0020247697830200195, 0.002162456512451172, 0.0023001432418823242, 0.0024378299713134766, 0.002575516700744629, 0.0027132034301757812, 0.0028508901596069336, 0.002988576889038086, 0.0031262636184692383, 0.0032639503479003906, 0.003401637077331543, 0.0035393238067626953, 0.0036770105361938477, 0.003814697265625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 2.0, 2.0, 3.0, 4.0, 10.0, 15.0, 19.0, 23.0, 36.0, 52.0, 60.0, 79.0, 112.0, 161.0, 283.0, 373.0, 514.0, 808.0, 1463.0, 2441.0, 5042.0, 14291.0, 104588.0, 849797.0, 48630.0, 10067.0, 4027.0, 2128.0, 1230.0, 670.0, 500.0, 369.0, 237.0, 145.0, 112.0, 76.0, 46.0, 39.0, 30.0, 26.0, 9.0, 11.0, 11.0, 4.0, 6.0, 1.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06439208984375, -0.062198638916015625, -0.06000518798828125, -0.057811737060546875, -0.0556182861328125, -0.053424835205078125, -0.05123138427734375, -0.049037933349609375, -0.046844482421875, -0.044651031494140625, -0.04245758056640625, -0.040264129638671875, -0.0380706787109375, -0.035877227783203125, -0.03368377685546875, -0.031490325927734375, -0.029296875, -0.027103424072265625, -0.02490997314453125, -0.022716522216796875, -0.0205230712890625, -0.018329620361328125, -0.01613616943359375, -0.013942718505859375, -0.011749267578125, -0.009555816650390625, -0.00736236572265625, -0.005168914794921875, -0.0029754638671875, -0.000782012939453125, 0.00141143798828125, 0.003604888916015625, 0.00579833984375, 0.007991790771484375, 0.01018524169921875, 0.012378692626953125, 0.0145721435546875, 0.016765594482421875, 0.01895904541015625, 0.021152496337890625, 0.023345947265625, 0.025539398193359375, 0.02773284912109375, 0.029926300048828125, 0.0321197509765625, 0.034313201904296875, 0.03650665283203125, 0.038700103759765625, 0.0408935546875, 0.043087005615234375, 0.04528045654296875, 0.047473907470703125, 0.0496673583984375, 0.051860809326171875, 0.05405426025390625, 0.056247711181640625, 0.058441162109375, 0.060634613037109375, 0.06282806396484375, 0.06502151489257812, 0.0672149658203125, 0.06940841674804688, 0.07160186767578125, 0.07379531860351562, 0.07598876953125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 2.0, 5.0, 9.0, 14.0, 17.0, 11.0, 17.0, 13.0, 19.0, 15.0, 23.0, 12.0, 24.0, 35.0, 33.0, 33.0, 39.0, 45.0, 42.0, 44.0, 47.0, 42.0, 31.0, 33.0, 47.0, 33.0, 32.0, 30.0, 24.0, 33.0, 25.0, 19.0, 25.0, 19.0, 17.0, 20.0, 18.0, 9.0, 10.0, 6.0, 5.0, 4.0, 5.0, 4.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01496124267578125, -0.014462113380432129, -0.013962984085083008, -0.013463854789733887, -0.012964725494384766, -0.012465596199035645, -0.011966466903686523, -0.011467337608337402, -0.010968208312988281, -0.01046907901763916, -0.009969949722290039, -0.009470820426940918, -0.008971691131591797, -0.008472561836242676, -0.007973432540893555, -0.007474303245544434, -0.0069751739501953125, -0.006476044654846191, -0.00597691535949707, -0.005477786064147949, -0.004978656768798828, -0.004479527473449707, -0.003980398178100586, -0.003481268882751465, -0.0029821395874023438, -0.0024830102920532227, -0.0019838809967041016, -0.0014847517013549805, -0.0009856224060058594, -0.0004864931106567383, 1.2636184692382812e-05, 0.0005117654800415039, 0.001010894775390625, 0.001510024070739746, 0.002009153366088867, 0.0025082826614379883, 0.0030074119567871094, 0.0035065412521362305, 0.0040056705474853516, 0.004504799842834473, 0.005003929138183594, 0.005503058433532715, 0.006002187728881836, 0.006501317024230957, 0.007000446319580078, 0.007499575614929199, 0.00799870491027832, 0.008497834205627441, 0.008996963500976562, 0.009496092796325684, 0.009995222091674805, 0.010494351387023926, 0.010993480682373047, 0.011492609977722168, 0.011991739273071289, 0.01249086856842041, 0.012989997863769531, 0.013489127159118652, 0.013988256454467773, 0.014487385749816895, 0.014986515045166016, 0.015485644340515137, 0.015984773635864258, 0.01648390293121338, 0.0169830322265625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 9.0, 11.0, 17.0, 19.0, 26.0, 38.0, 52.0, 79.0, 128.0, 164.0, 292.0, 539.0, 1053.0, 2242.0, 7074.0, 54861.0, 940969.0, 31376.0, 5455.0, 1946.0, 920.0, 457.0, 286.0, 163.0, 106.0, 69.0, 48.0, 32.0, 29.0, 17.0, 19.0, 11.0, 12.0, 4.0, 4.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0633544921875, -0.06151294708251953, -0.05967140197753906, -0.057829856872558594, -0.055988311767578125, -0.054146766662597656, -0.05230522155761719, -0.05046367645263672, -0.04862213134765625, -0.04678058624267578, -0.04493904113769531, -0.043097496032714844, -0.041255950927734375, -0.039414405822753906, -0.03757286071777344, -0.03573131561279297, -0.0338897705078125, -0.03204822540283203, -0.030206680297851562, -0.028365135192871094, -0.026523590087890625, -0.024682044982910156, -0.022840499877929688, -0.02099895477294922, -0.01915740966796875, -0.01731586456298828, -0.015474319458007812, -0.013632774353027344, -0.011791229248046875, -0.009949684143066406, -0.008108139038085938, -0.006266593933105469, -0.004425048828125, -0.0025835037231445312, -0.0007419586181640625, 0.0010995864868164062, 0.002941131591796875, 0.004782676696777344, 0.0066242218017578125, 0.008465766906738281, 0.01030731201171875, 0.012148857116699219, 0.013990402221679688, 0.015831947326660156, 0.017673492431640625, 0.019515037536621094, 0.021356582641601562, 0.02319812774658203, 0.0250396728515625, 0.02688121795654297, 0.028722763061523438, 0.030564308166503906, 0.032405853271484375, 0.034247398376464844, 0.03608894348144531, 0.03793048858642578, 0.03977203369140625, 0.04161357879638672, 0.04345512390136719, 0.045296669006347656, 0.047138214111328125, 0.048979759216308594, 0.05082130432128906, 0.05266284942626953, 0.05450439453125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 7.0, 12.0, 10.0, 15.0, 30.0, 28.0, 57.0, 90.0, 125.0, 154.0, 130.0, 99.0, 90.0, 49.0, 30.0, 15.0, 19.0, 12.0, 7.0, 10.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.467632293701172e-05, -2.3876316845417023e-05, -2.3076310753822327e-05, -2.227630466222763e-05, -2.1476298570632935e-05, -2.067629247903824e-05, -1.9876286387443542e-05, -1.9076280295848846e-05, -1.827627420425415e-05, -1.7476268112659454e-05, -1.6676262021064758e-05, -1.5876255929470062e-05, -1.5076249837875366e-05, -1.427624374628067e-05, -1.3476237654685974e-05, -1.2676231563091278e-05, -1.1876225471496582e-05, -1.1076219379901886e-05, -1.027621328830719e-05, -9.476207196712494e-06, -8.676201105117798e-06, -7.876195013523102e-06, -7.076188921928406e-06, -6.27618283033371e-06, -5.476176738739014e-06, -4.676170647144318e-06, -3.876164555549622e-06, -3.0761584639549255e-06, -2.2761523723602295e-06, -1.4761462807655334e-06, -6.761401891708374e-07, 1.2386590242385864e-07, 9.238719940185547e-07, 1.7238780856132507e-06, 2.5238841772079468e-06, 3.323890268802643e-06, 4.123896360397339e-06, 4.923902451992035e-06, 5.723908543586731e-06, 6.523914635181427e-06, 7.323920726776123e-06, 8.123926818370819e-06, 8.923932909965515e-06, 9.723939001560211e-06, 1.0523945093154907e-05, 1.1323951184749603e-05, 1.21239572763443e-05, 1.2923963367938995e-05, 1.3723969459533691e-05, 1.4523975551128387e-05, 1.5323981642723083e-05, 1.612398773431778e-05, 1.6923993825912476e-05, 1.772399991750717e-05, 1.8524006009101868e-05, 1.9324012100696564e-05, 2.012401819229126e-05, 2.0924024283885956e-05, 2.1724030375480652e-05, 2.2524036467075348e-05, 2.3324042558670044e-05, 2.412404865026474e-05, 2.4924054741859436e-05, 2.5724060833454132e-05, 2.6524066925048828e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 9.0, 13.0, 10.0, 12.0, 24.0, 18.0, 24.0, 40.0, 64.0, 110.0, 161.0, 289.0, 603.0, 1480.0, 6161.0, 173889.0, 853289.0, 8962.0, 1785.0, 707.0, 335.0, 183.0, 109.0, 89.0, 64.0, 28.0, 21.0, 21.0, 15.0, 12.0, 11.0, 6.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1019287109375, -0.09786605834960938, -0.09380340576171875, -0.08974075317382812, -0.0856781005859375, -0.08161544799804688, -0.07755279541015625, -0.07349014282226562, -0.069427490234375, -0.06536483764648438, -0.06130218505859375, -0.057239532470703125, -0.0531768798828125, -0.049114227294921875, -0.04505157470703125, -0.040988922119140625, -0.03692626953125, -0.032863616943359375, -0.02880096435546875, -0.024738311767578125, -0.0206756591796875, -0.016613006591796875, -0.01255035400390625, -0.008487701416015625, -0.004425048828125, -0.000362396240234375, 0.00370025634765625, 0.007762908935546875, 0.0118255615234375, 0.015888214111328125, 0.01995086669921875, 0.024013519287109375, 0.028076171875, 0.032138824462890625, 0.03620147705078125, 0.040264129638671875, 0.0443267822265625, 0.048389434814453125, 0.05245208740234375, 0.056514739990234375, 0.060577392578125, 0.06464004516601562, 0.06870269775390625, 0.07276535034179688, 0.0768280029296875, 0.08089065551757812, 0.08495330810546875, 0.08901596069335938, 0.09307861328125, 0.09714126586914062, 0.10120391845703125, 0.10526657104492188, 0.1093292236328125, 0.11339187622070312, 0.11745452880859375, 0.12151718139648438, 0.125579833984375, 0.12964248657226562, 0.13370513916015625, 0.13776779174804688, 0.1418304443359375, 0.14589309692382812, 0.14995574951171875, 0.15401840209960938, 0.1580810546875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 9.0, 8.0, 10.0, 9.0, 17.0, 19.0, 26.0, 35.0, 61.0, 120.0, 258.0, 164.0, 75.0, 43.0, 37.0, 37.0, 14.0, 11.0, 4.0, 8.0, 11.0, 2.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019805908203125, -0.018972396850585938, -0.018138885498046875, -0.017305374145507812, -0.01647186279296875, -0.015638351440429688, -0.014804840087890625, -0.013971328735351562, -0.0131378173828125, -0.012304306030273438, -0.011470794677734375, -0.010637283325195312, -0.00980377197265625, -0.008970260620117188, -0.008136749267578125, -0.0073032379150390625, -0.0064697265625, -0.0056362152099609375, -0.004802703857421875, -0.0039691925048828125, -0.00313568115234375, -0.0023021697998046875, -0.001468658447265625, -0.0006351470947265625, 0.0001983642578125, 0.0010318756103515625, 0.001865386962890625, 0.0026988983154296875, 0.00353240966796875, 0.0043659210205078125, 0.005199432373046875, 0.0060329437255859375, 0.006866455078125, 0.0076999664306640625, 0.008533477783203125, 0.009366989135742188, 0.01020050048828125, 0.011034011840820312, 0.011867523193359375, 0.012701034545898438, 0.0135345458984375, 0.014368057250976562, 0.015201568603515625, 0.016035079956054688, 0.01686859130859375, 0.017702102661132812, 0.018535614013671875, 0.019369125366210938, 0.02020263671875, 0.021036148071289062, 0.021869659423828125, 0.022703170776367188, 0.02353668212890625, 0.024370193481445312, 0.025203704833984375, 0.026037216186523438, 0.0268707275390625, 0.027704238891601562, 0.028537750244140625, 0.029371261596679688, 0.03020477294921875, 0.031038284301757812, 0.031871795654296875, 0.03270530700683594, 0.033538818359375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 6.0, 1.0, 15.0, 69.0, 821.0, 63.0, 15.0, 7.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6119351387023926, -1.5607823133468628, -1.509629487991333, -1.4584765434265137, -1.4073237180709839, -1.356170892715454, -1.3050180673599243, -1.2538652420043945, -1.2027122974395752, -1.1515594720840454, -1.1004066467285156, -1.0492537021636963, -0.9981008768081665, -0.9469480514526367, -0.8957952260971069, -0.8446423411369324, -0.7934895157814026, -0.7423366904258728, -0.6911838054656982, -0.6400309801101685, -0.5888780951499939, -0.5377252697944641, -0.48657241463661194, -0.43541955947875977, -0.3842667043209076, -0.3331138491630554, -0.28196099400520325, -0.23080815374851227, -0.1796552985906601, -0.12850245833396912, -0.07734960317611694, -0.02619674801826477, 0.024956107139587402, 0.07610896229743958, 0.12726181745529175, 0.17841465771198273, 0.2295675128698349, 0.2807203531265259, 0.33187320828437805, 0.3830260634422302, 0.4341789186000824, 0.48533177375793457, 0.5364845991134644, 0.5876374840736389, 0.6387903094291687, 0.6899431943893433, 0.741096019744873, 0.7922488451004028, 0.8434017300605774, 0.8945545554161072, 0.9457074403762817, 0.9968602657318115, 1.0480130910873413, 1.099165916442871, 1.1503188610076904, 1.2014716863632202, 1.25262451171875, 1.3037773370742798, 1.3549301624298096, 1.406083106994629, 1.4572359323501587, 1.5083887577056885, 1.5595415830612183, 1.610694408416748, 1.6618473529815674]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 3.0, 4.0, 5.0, 7.0, 10.0, 10.0, 16.0, 16.0, 41.0, 66.0, 96.0, 172.0, 181.0, 123.0, 93.0, 56.0, 31.0, 8.0, 21.0, 5.0, 5.0, 8.0, 6.0, 1.0, 5.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3071763515472412, -0.2950688600540161, -0.282961368560791, -0.2708538770675659, -0.25874635577201843, -0.24663886427879333, -0.23453137278556824, -0.22242388129234314, -0.21031638979911804, -0.19820889830589294, -0.18610139191150665, -0.17399390041828156, -0.16188640892505646, -0.14977890253067017, -0.13767141103744507, -0.12556391954421997, -0.11345641314983368, -0.10134891420602798, -0.08924142271280289, -0.07713392376899719, -0.0650264322757721, -0.0529189333319664, -0.040811434388160706, -0.028703942894935608, -0.016596443951129913, -0.004488947801291943, 0.007618548348546028, 0.019726045429706573, 0.03183354064822197, 0.043941035866737366, 0.05604853481054306, 0.06815602630376816, 0.08026352524757385, 0.09237102419137955, 0.10447851568460464, 0.11658601462841034, 0.12869350612163544, 0.14080101251602173, 0.15290850400924683, 0.16501599550247192, 0.17712348699569702, 0.18923097848892212, 0.2013384848833084, 0.2134459763765335, 0.2255534678697586, 0.2376609742641449, 0.24976846575737, 0.2618759572505951, 0.2739834785461426, 0.2860909700393677, 0.2981984615325928, 0.31030595302581787, 0.32241347432136536, 0.33452096581459045, 0.34662845730781555, 0.35873594880104065, 0.37084344029426575, 0.38295093178749084, 0.39505842328071594, 0.4071659445762634, 0.4192734360694885, 0.4313809275627136, 0.4434884190559387, 0.4555959105491638, 0.4677034020423889]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 3.0, 3.0, 6.0, 6.0, 5.0, 5.0, 22.0, 12.0, 21.0, 32.0, 45.0, 87.0, 377.0, 10388.0, 4175244.0, 7491.0, 325.0, 61.0, 39.0, 27.0, 10.0, 23.0, 11.0, 6.0, 7.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.263671875, -3.166107177734375, -3.06854248046875, -2.970977783203125, -2.8734130859375, -2.775848388671875, -2.67828369140625, -2.580718994140625, -2.483154296875, -2.385589599609375, -2.28802490234375, -2.190460205078125, -2.0928955078125, -1.995330810546875, -1.89776611328125, -1.800201416015625, -1.70263671875, -1.605072021484375, -1.50750732421875, -1.409942626953125, -1.3123779296875, -1.214813232421875, -1.11724853515625, -1.019683837890625, -0.922119140625, -0.824554443359375, -0.72698974609375, -0.629425048828125, -0.5318603515625, -0.434295654296875, -0.33673095703125, -0.239166259765625, -0.1416015625, -0.044036865234375, 0.05352783203125, 0.151092529296875, 0.2486572265625, 0.346221923828125, 0.44378662109375, 0.541351318359375, 0.638916015625, 0.736480712890625, 0.83404541015625, 0.931610107421875, 1.0291748046875, 1.126739501953125, 1.22430419921875, 1.321868896484375, 1.41943359375, 1.516998291015625, 1.61456298828125, 1.712127685546875, 1.8096923828125, 1.907257080078125, 2.00482177734375, 2.102386474609375, 2.199951171875, 2.297515869140625, 2.39508056640625, 2.492645263671875, 2.5902099609375, 2.687774658203125, 2.78533935546875, 2.882904052734375, 2.98046875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 4.0, 1.0, 10.0, 7.0, 10.0, 3.0, 11.0, 22.0, 49.0, 73.0, 169.0, 232.0, 163.0, 94.0, 44.0, 30.0, 15.0, 4.0, 9.0, 3.0, 7.0, 4.0, 9.0, 2.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0038433074951171875, -0.003741025924682617, -0.003638744354248047, -0.0035364627838134766, -0.0034341812133789062, -0.003331899642944336, -0.0032296180725097656, -0.0031273365020751953, -0.003025054931640625, -0.0029227733612060547, -0.0028204917907714844, -0.002718210220336914, -0.0026159286499023438, -0.0025136470794677734, -0.002411365509033203, -0.002309083938598633, -0.0022068023681640625, -0.002104520797729492, -0.002002239227294922, -0.0018999576568603516, -0.0017976760864257812, -0.001695394515991211, -0.0015931129455566406, -0.0014908313751220703, -0.0013885498046875, -0.0012862682342529297, -0.0011839866638183594, -0.001081705093383789, -0.0009794235229492188, -0.0008771419525146484, -0.0007748603820800781, -0.0006725788116455078, -0.0005702972412109375, -0.0004680156707763672, -0.0003657341003417969, -0.00026345252990722656, -0.00016117095947265625, -5.888938903808594e-05, 4.3392181396484375e-05, 0.0001456737518310547, 0.000247955322265625, 0.0003502368927001953, 0.0004525184631347656, 0.0005548000335693359, 0.0006570816040039062, 0.0007593631744384766, 0.0008616447448730469, 0.0009639263153076172, 0.0010662078857421875, 0.0011684894561767578, 0.0012707710266113281, 0.0013730525970458984, 0.0014753341674804688, 0.001577615737915039, 0.0016798973083496094, 0.0017821788787841797, 0.00188446044921875, 0.0019867420196533203, 0.0020890235900878906, 0.002191305160522461, 0.0022935867309570312, 0.0023958683013916016, 0.002498149871826172, 0.002600431442260742, 0.0027027130126953125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 12.0, 12.0, 15.0, 16.0, 28.0, 39.0, 47.0, 59.0, 67.0, 78.0, 110.0, 129.0, 376.0, 25231.0, 4163854.0, 3079.0, 319.0, 149.0, 118.0, 94.0, 100.0, 66.0, 63.0, 48.0, 35.0, 33.0, 32.0, 23.0, 9.0, 12.0, 3.0, 4.0, 7.0, 6.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3798828125, -0.3620452880859375, -0.344207763671875, -0.3263702392578125, -0.30853271484375, -0.2906951904296875, -0.272857666015625, -0.2550201416015625, -0.2371826171875, -0.2193450927734375, -0.201507568359375, -0.1836700439453125, -0.16583251953125, -0.1479949951171875, -0.130157470703125, -0.1123199462890625, -0.094482421875, -0.0766448974609375, -0.058807373046875, -0.0409698486328125, -0.02313232421875, -0.0052947998046875, 0.012542724609375, 0.0303802490234375, 0.0482177734375, 0.0660552978515625, 0.083892822265625, 0.1017303466796875, 0.11956787109375, 0.1374053955078125, 0.155242919921875, 0.1730804443359375, 0.19091796875, 0.2087554931640625, 0.226593017578125, 0.2444305419921875, 0.26226806640625, 0.2801055908203125, 0.297943115234375, 0.3157806396484375, 0.3336181640625, 0.3514556884765625, 0.369293212890625, 0.3871307373046875, 0.40496826171875, 0.4228057861328125, 0.440643310546875, 0.4584808349609375, 0.476318359375, 0.4941558837890625, 0.511993408203125, 0.5298309326171875, 0.54766845703125, 0.5655059814453125, 0.583343505859375, 0.6011810302734375, 0.6190185546875, 0.6368560791015625, 0.654693603515625, 0.6725311279296875, 0.69036865234375, 0.7082061767578125, 0.726043701171875, 0.7438812255859375, 0.76171875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 10.0, 8.0, 9.0, 13.0, 22.0, 18.0, 37.0, 46.0, 62.0, 80.0, 88.0, 116.0, 128.0, 179.0, 258.0, 464.0, 1000.0, 307.0, 262.0, 199.0, 144.0, 108.0, 103.0, 96.0, 63.0, 60.0, 50.0, 41.0, 21.0, 15.0, 13.0, 12.0, 14.0, 5.0, 10.0, 6.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00516510009765625, -0.004999339580535889, -0.004833579063415527, -0.004667818546295166, -0.004502058029174805, -0.004336297512054443, -0.004170536994934082, -0.004004776477813721, -0.0038390159606933594, -0.003673255443572998, -0.0035074949264526367, -0.0033417344093322754, -0.003175973892211914, -0.0030102133750915527, -0.0028444528579711914, -0.00267869234085083, -0.0025129318237304688, -0.0023471713066101074, -0.002181410789489746, -0.0020156502723693848, -0.0018498897552490234, -0.0016841292381286621, -0.0015183687210083008, -0.0013526082038879395, -0.0011868476867675781, -0.0010210871696472168, -0.0008553266525268555, -0.0006895661354064941, -0.0005238056182861328, -0.0003580451011657715, -0.00019228458404541016, -2.6524066925048828e-05, 0.0001392364501953125, 0.00030499696731567383, 0.00047075748443603516, 0.0006365180015563965, 0.0008022785186767578, 0.0009680390357971191, 0.0011337995529174805, 0.0012995600700378418, 0.0014653205871582031, 0.0016310811042785645, 0.0017968416213989258, 0.001962602138519287, 0.0021283626556396484, 0.0022941231727600098, 0.002459883689880371, 0.0026256442070007324, 0.0027914047241210938, 0.002957165241241455, 0.0031229257583618164, 0.0032886862754821777, 0.003454446792602539, 0.0036202073097229004, 0.0037859678268432617, 0.003951728343963623, 0.004117488861083984, 0.004283249378204346, 0.004449009895324707, 0.004614770412445068, 0.00478053092956543, 0.004946291446685791, 0.005112051963806152, 0.005277812480926514, 0.005443572998046875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [5.0, 936.0, 70.0, 9.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06874086707830429, -0.023419111967086792, 0.021902643144130707, 0.06722439080476761, 0.1125461533665657, 0.1578679084777832, 0.2031896412372589, 0.248511403799057, 0.2938331663608551, 0.3391549289226532, 0.3844766616821289, 0.429798424243927, 0.4751201868057251, 0.5204419493675232, 0.5657637119293213, 0.6110854148864746, 0.6564072370529175, 0.7017289996147156, 0.7470507621765137, 0.792372465133667, 0.8376942873001099, 0.8830159902572632, 0.9283377528190613, 0.9736595153808594, 1.0189812183380127, 1.064302921295166, 1.1096247434616089, 1.1549464464187622, 1.200268268585205, 1.2455899715423584, 1.2909116744995117, 1.3362334966659546, 1.3815553188323975, 1.4268770217895508, 1.4721988439559937, 1.517520546913147, 1.5628423690795898, 1.6081640720367432, 1.6534857749938965, 1.6988075971603394, 1.7441294193267822, 1.7894511222839355, 1.8347729444503784, 1.8800946474075317, 1.9254164695739746, 1.970738172531128, 2.0160598754882812, 2.0613818168640137, 2.106703281402588, 2.152024984359741, 2.1973466873168945, 2.242668628692627, 2.2879903316497803, 2.3333120346069336, 2.378633737564087, 2.4239554405212402, 2.4692773818969727, 2.514599084854126, 2.5599207878112793, 2.6052427291870117, 2.650564432144165, 2.6958861351013184, 2.7412078380584717, 2.786529541015625, 2.8318514823913574]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 7.0, 18.0, 20.0, 38.0, 48.0, 56.0, 96.0, 147.0, 118.0, 125.0, 101.0, 79.0, 60.0, 35.0, 28.0, 17.0, 9.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052376389503479004, -0.04838957265019417, -0.04440275579690933, -0.040415938943624496, -0.03642912209033966, -0.032442305237054825, -0.02845548838376999, -0.024468671530485153, -0.020481854677200317, -0.01649503782391548, -0.012508220970630646, -0.00852140411734581, -0.004534587264060974, -0.0005477704107761383, 0.0034390464425086975, 0.007425863295793533, 0.01141268014907837, 0.015399497002363205, 0.01938631385564804, 0.023373130708932877, 0.027359947562217712, 0.03134676441550255, 0.035333581268787384, 0.03932039812207222, 0.043307214975357056, 0.04729403182864189, 0.05128084868192673, 0.05526766553521156, 0.0592544823884964, 0.06324130296707153, 0.06722811609506607, 0.07121492922306061, 0.07520174980163574, 0.07918857038021088, 0.08317538350820541, 0.08716219663619995, 0.09114901721477509, 0.09513583779335022, 0.09912265092134476, 0.1031094640493393, 0.10709628462791443, 0.11108310520648956, 0.1150699183344841, 0.11905673146247864, 0.12304355204105377, 0.1270303726196289, 0.13101717829704285, 0.13500399887561798, 0.13899081945419312, 0.14297764003276825, 0.14696446061134338, 0.15095126628875732, 0.15493808686733246, 0.1589249074459076, 0.16291171312332153, 0.16689853370189667, 0.1708853542804718, 0.17487217485904694, 0.17885899543762207, 0.182845801115036, 0.18683262169361115, 0.19081944227218628, 0.19480624794960022, 0.19879306852817535, 0.2027798891067505]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 7.0, 9.0, 15.0, 20.0, 21.0, 46.0, 41.0, 93.0, 108.0, 185.0, 257.0, 407.0, 612.0, 1076.0, 1730.0, 3101.0, 6196.0, 13778.0, 40129.0, 299962.0, 583648.0, 62545.0, 17851.0, 7617.0, 3774.0, 2024.0, 1204.0, 740.0, 454.0, 292.0, 201.0, 137.0, 96.0, 65.0, 34.0, 24.0, 16.0, 13.0, 10.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.041534423828125, -0.04020071029663086, -0.03886699676513672, -0.03753328323364258, -0.03619956970214844, -0.0348658561706543, -0.033532142639160156, -0.032198429107666016, -0.030864715576171875, -0.029531002044677734, -0.028197288513183594, -0.026863574981689453, -0.025529861450195312, -0.024196147918701172, -0.02286243438720703, -0.02152872085571289, -0.02019500732421875, -0.01886129379272461, -0.01752758026123047, -0.016193866729736328, -0.014860153198242188, -0.013526439666748047, -0.012192726135253906, -0.010859012603759766, -0.009525299072265625, -0.008191585540771484, -0.006857872009277344, -0.005524158477783203, -0.0041904449462890625, -0.002856731414794922, -0.0015230178833007812, -0.00018930435180664062, 0.0011444091796875, 0.0024781227111816406, 0.0038118362426757812, 0.005145549774169922, 0.0064792633056640625, 0.007812976837158203, 0.009146690368652344, 0.010480403900146484, 0.011814117431640625, 0.013147830963134766, 0.014481544494628906, 0.015815258026123047, 0.017148971557617188, 0.018482685089111328, 0.01981639862060547, 0.02115011215209961, 0.02248382568359375, 0.02381753921508789, 0.02515125274658203, 0.026484966278076172, 0.027818679809570312, 0.029152393341064453, 0.030486106872558594, 0.031819820404052734, 0.033153533935546875, 0.034487247467041016, 0.035820960998535156, 0.0371546745300293, 0.03848838806152344, 0.03982210159301758, 0.04115581512451172, 0.04248952865600586, 0.0438232421875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 5.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 6.0, 12.0, 11.0, 12.0, 39.0, 40.0, 51.0, 86.0, 99.0, 123.0, 107.0, 102.0, 83.0, 57.0, 36.0, 26.0, 16.0, 17.0, 11.0, 6.0, 4.0, 9.0, 2.0, 2.0, 2.0, 6.0, 0.0, 2.0, 6.0, 1.0, 4.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002552032470703125, -0.0024698078632354736, -0.0023875832557678223, -0.002305358648300171, -0.0022231340408325195, -0.002140909433364868, -0.002058684825897217, -0.0019764602184295654, -0.001894235610961914, -0.0018120110034942627, -0.0017297863960266113, -0.00164756178855896, -0.0015653371810913086, -0.0014831125736236572, -0.0014008879661560059, -0.0013186633586883545, -0.0012364387512207031, -0.0011542141437530518, -0.0010719895362854004, -0.000989764928817749, -0.0009075403213500977, -0.0008253157138824463, -0.0007430911064147949, -0.0006608664989471436, -0.0005786418914794922, -0.0004964172840118408, -0.00041419267654418945, -0.0003319680690765381, -0.0002497434616088867, -0.00016751885414123535, -8.529424667358398e-05, -3.069639205932617e-06, 7.915496826171875e-05, 0.00016137957572937012, 0.00024360418319702148, 0.00032582879066467285, 0.0004080533981323242, 0.0004902780055999756, 0.000572502613067627, 0.0006547272205352783, 0.0007369518280029297, 0.0008191764354705811, 0.0009014010429382324, 0.0009836256504058838, 0.0010658502578735352, 0.0011480748653411865, 0.0012302994728088379, 0.0013125240802764893, 0.0013947486877441406, 0.001476973295211792, 0.0015591979026794434, 0.0016414225101470947, 0.001723647117614746, 0.0018058717250823975, 0.0018880963325500488, 0.0019703209400177, 0.0020525455474853516, 0.002134770154953003, 0.0022169947624206543, 0.0022992193698883057, 0.002381443977355957, 0.0024636685848236084, 0.0025458931922912598, 0.002628117799758911, 0.0027103424072265625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 1.0, 7.0, 5.0, 8.0, 15.0, 20.0, 14.0, 36.0, 26.0, 41.0, 43.0, 65.0, 137.0, 906.0, 21498.0, 1007764.0, 16738.0, 824.0, 150.0, 59.0, 46.0, 26.0, 18.0, 25.0, 23.0, 14.0, 10.0, 9.0, 6.0, 8.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.133056640625, -0.12821388244628906, -0.12337112426757812, -0.11852836608886719, -0.11368560791015625, -0.10884284973144531, -0.10400009155273438, -0.09915733337402344, -0.0943145751953125, -0.08947181701660156, -0.08462905883789062, -0.07978630065917969, -0.07494354248046875, -0.07010078430175781, -0.06525802612304688, -0.06041526794433594, -0.055572509765625, -0.05072975158691406, -0.045886993408203125, -0.04104423522949219, -0.03620147705078125, -0.03135871887207031, -0.026515960693359375, -0.021673202514648438, -0.0168304443359375, -0.011987686157226562, -0.007144927978515625, -0.0023021697998046875, 0.00254058837890625, 0.0073833465576171875, 0.012226104736328125, 0.017068862915039062, 0.02191162109375, 0.026754379272460938, 0.031597137451171875, 0.03643989562988281, 0.04128265380859375, 0.04612541198730469, 0.050968170166015625, 0.05581092834472656, 0.0606536865234375, 0.06549644470214844, 0.07033920288085938, 0.07518196105957031, 0.08002471923828125, 0.08486747741699219, 0.08971023559570312, 0.09455299377441406, 0.099395751953125, 0.10423851013183594, 0.10908126831054688, 0.11392402648925781, 0.11876678466796875, 0.12360954284667969, 0.12845230102539062, 0.13329505920410156, 0.1381378173828125, 0.14298057556152344, 0.14782333374023438, 0.1526660919189453, 0.15750885009765625, 0.1623516082763672, 0.16719436645507812, 0.17203712463378906, 0.1768798828125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 9.0, 12.0, 9.0, 15.0, 33.0, 22.0, 24.0, 41.0, 26.0, 43.0, 34.0, 55.0, 50.0, 50.0, 48.0, 48.0, 52.0, 57.0, 37.0, 46.0, 41.0, 47.0, 31.0, 33.0, 29.0, 16.0, 21.0, 13.0, 14.0, 12.0, 7.0, 3.0, 8.0, 2.0, 5.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.01611328125, -0.01569366455078125, -0.0152740478515625, -0.01485443115234375, -0.014434814453125, -0.01401519775390625, -0.0135955810546875, -0.01317596435546875, -0.01275634765625, -0.01233673095703125, -0.0119171142578125, -0.01149749755859375, -0.011077880859375, -0.01065826416015625, -0.0102386474609375, -0.00981903076171875, -0.0093994140625, -0.00897979736328125, -0.0085601806640625, -0.00814056396484375, -0.007720947265625, -0.00730133056640625, -0.0068817138671875, -0.00646209716796875, -0.00604248046875, -0.00562286376953125, -0.0052032470703125, -0.00478363037109375, -0.004364013671875, -0.00394439697265625, -0.0035247802734375, -0.00310516357421875, -0.002685546875, -0.00226593017578125, -0.0018463134765625, -0.00142669677734375, -0.001007080078125, -0.00058746337890625, -0.0001678466796875, 0.00025177001953125, 0.00067138671875, 0.00109100341796875, 0.0015106201171875, 0.00193023681640625, 0.002349853515625, 0.00276947021484375, 0.0031890869140625, 0.00360870361328125, 0.0040283203125, 0.00444793701171875, 0.0048675537109375, 0.00528717041015625, 0.005706787109375, 0.00612640380859375, 0.0065460205078125, 0.00696563720703125, 0.00738525390625, 0.00780487060546875, 0.0082244873046875, 0.00864410400390625, 0.009063720703125, 0.00948333740234375, 0.0099029541015625, 0.01032257080078125, 0.0107421875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 3.0, 5.0, 7.0, 3.0, 8.0, 7.0, 5.0, 10.0, 13.0, 15.0, 13.0, 36.0, 48.0, 129.0, 581.0, 4178.0, 963213.0, 77670.0, 1962.0, 385.0, 89.0, 48.0, 33.0, 14.0, 12.0, 7.0, 8.0, 11.0, 7.0, 4.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.09429931640625, -0.09103107452392578, -0.08776283264160156, -0.08449459075927734, -0.08122634887695312, -0.0779581069946289, -0.07468986511230469, -0.07142162322998047, -0.06815338134765625, -0.06488513946533203, -0.06161689758300781, -0.058348655700683594, -0.055080413818359375, -0.051812171936035156, -0.04854393005371094, -0.04527568817138672, -0.0420074462890625, -0.03873920440673828, -0.03547096252441406, -0.032202720642089844, -0.028934478759765625, -0.025666236877441406, -0.022397994995117188, -0.01912975311279297, -0.01586151123046875, -0.012593269348144531, -0.009325027465820312, -0.006056785583496094, -0.002788543701171875, 0.00047969818115234375, 0.0037479400634765625, 0.007016181945800781, 0.010284423828125, 0.013552665710449219, 0.016820907592773438, 0.020089149475097656, 0.023357391357421875, 0.026625633239746094, 0.029893875122070312, 0.03316211700439453, 0.03643035888671875, 0.03969860076904297, 0.04296684265136719, 0.046235084533691406, 0.049503326416015625, 0.052771568298339844, 0.05603981018066406, 0.05930805206298828, 0.0625762939453125, 0.06584453582763672, 0.06911277770996094, 0.07238101959228516, 0.07564926147460938, 0.0789175033569336, 0.08218574523925781, 0.08545398712158203, 0.08872222900390625, 0.09199047088623047, 0.09525871276855469, 0.0985269546508789, 0.10179519653320312, 0.10506343841552734, 0.10833168029785156, 0.11159992218017578, 0.1148681640625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 10.0, 7.0, 15.0, 20.0, 24.0, 47.0, 141.0, 383.0, 198.0, 64.0, 20.0, 20.0, 14.0, 11.0, 10.0, 8.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00023555755615234375, -0.00023016054183244705, -0.00022476352751255035, -0.00021936651319265366, -0.00021396949887275696, -0.00020857248455286026, -0.00020317547023296356, -0.00019777845591306686, -0.00019238144159317017, -0.00018698442727327347, -0.00018158741295337677, -0.00017619039863348007, -0.00017079338431358337, -0.00016539636999368668, -0.00015999935567378998, -0.00015460234135389328, -0.00014920532703399658, -0.00014380831271409988, -0.00013841129839420319, -0.0001330142840743065, -0.0001276172697544098, -0.0001222202554345131, -0.0001168232411146164, -0.0001114262267947197, -0.000106029212474823, -0.0001006321981549263, -9.52351838350296e-05, -8.98381695151329e-05, -8.44411551952362e-05, -7.904414087533951e-05, -7.364712655544281e-05, -6.825011223554611e-05, -6.285309791564941e-05, -5.7456083595752716e-05, -5.205906927585602e-05, -4.666205495595932e-05, -4.126504063606262e-05, -3.5868026316165924e-05, -3.0471011996269226e-05, -2.5073997676372528e-05, -1.967698335647583e-05, -1.4279969036579132e-05, -8.882954716682434e-06, -3.485940396785736e-06, 1.911073923110962e-06, 7.30808824300766e-06, 1.2705102562904358e-05, 1.8102116882801056e-05, 2.3499131202697754e-05, 2.8896145522594452e-05, 3.429315984249115e-05, 3.969017416238785e-05, 4.5087188482284546e-05, 5.0484202802181244e-05, 5.588121712207794e-05, 6.127823144197464e-05, 6.667524576187134e-05, 7.207226008176804e-05, 7.746927440166473e-05, 8.286628872156143e-05, 8.826330304145813e-05, 9.366031736135483e-05, 9.905733168125153e-05, 0.00010445434600114822, 0.00010985136032104492]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 7.0, 13.0, 6.0, 12.0, 22.0, 33.0, 79.0, 143.0, 343.0, 972.0, 3276.0, 18176.0, 871556.0, 141610.0, 9132.0, 2041.0, 668.0, 226.0, 105.0, 49.0, 20.0, 22.0, 13.0, 7.0, 4.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09539794921875, -0.09257888793945312, -0.08975982666015625, -0.08694076538085938, -0.0841217041015625, -0.08130264282226562, -0.07848358154296875, -0.07566452026367188, -0.072845458984375, -0.07002639770507812, -0.06720733642578125, -0.06438827514648438, -0.0615692138671875, -0.058750152587890625, -0.05593109130859375, -0.053112030029296875, -0.05029296875, -0.047473907470703125, -0.04465484619140625, -0.041835784912109375, -0.0390167236328125, -0.036197662353515625, -0.03337860107421875, -0.030559539794921875, -0.027740478515625, -0.024921417236328125, -0.02210235595703125, -0.019283294677734375, -0.0164642333984375, -0.013645172119140625, -0.01082611083984375, -0.008007049560546875, -0.00518798828125, -0.002368927001953125, 0.00045013427734375, 0.003269195556640625, 0.0060882568359375, 0.008907318115234375, 0.01172637939453125, 0.014545440673828125, 0.017364501953125, 0.020183563232421875, 0.02300262451171875, 0.025821685791015625, 0.0286407470703125, 0.031459808349609375, 0.03427886962890625, 0.037097930908203125, 0.0399169921875, 0.042736053466796875, 0.04555511474609375, 0.048374176025390625, 0.0511932373046875, 0.054012298583984375, 0.05683135986328125, 0.059650421142578125, 0.062469482421875, 0.06528854370117188, 0.06810760498046875, 0.07092666625976562, 0.0737457275390625, 0.07656478881835938, 0.07938385009765625, 0.08220291137695312, 0.08502197265625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 7.0, 3.0, 3.0, 4.0, 4.0, 4.0, 8.0, 11.0, 20.0, 36.0, 52.0, 138.0, 457.0, 125.0, 59.0, 37.0, 16.0, 7.0, 7.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030303955078125, -0.029312610626220703, -0.028321266174316406, -0.02732992172241211, -0.026338577270507812, -0.025347232818603516, -0.02435588836669922, -0.023364543914794922, -0.022373199462890625, -0.021381855010986328, -0.02039051055908203, -0.019399166107177734, -0.018407821655273438, -0.01741647720336914, -0.016425132751464844, -0.015433788299560547, -0.01444244384765625, -0.013451099395751953, -0.012459754943847656, -0.01146841049194336, -0.010477066040039062, -0.009485721588134766, -0.008494377136230469, -0.007503032684326172, -0.006511688232421875, -0.005520343780517578, -0.004528999328613281, -0.0035376548767089844, -0.0025463104248046875, -0.0015549659729003906, -0.0005636215209960938, 0.0004277229309082031, 0.0014190673828125, 0.002410411834716797, 0.0034017562866210938, 0.004393100738525391, 0.0053844451904296875, 0.006375789642333984, 0.007367134094238281, 0.008358478546142578, 0.009349822998046875, 0.010341167449951172, 0.011332511901855469, 0.012323856353759766, 0.013315200805664062, 0.01430654525756836, 0.015297889709472656, 0.016289234161376953, 0.01728057861328125, 0.018271923065185547, 0.019263267517089844, 0.02025461196899414, 0.021245956420898438, 0.022237300872802734, 0.02322864532470703, 0.024219989776611328, 0.025211334228515625, 0.026202678680419922, 0.02719402313232422, 0.028185367584228516, 0.029176712036132812, 0.03016805648803711, 0.031159400939941406, 0.0321507453918457, 0.03314208984375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 13.0, 57.0, 237.0, 482.0, 161.0, 32.0, 6.0, 4.0, 3.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20942550897598267, -0.19576814770698547, -0.18211078643798828, -0.1684534251689911, -0.1547960638999939, -0.1411387026309967, -0.12748132646083832, -0.11382396519184113, -0.10016660392284393, -0.08650924265384674, -0.07285188138484955, -0.05919451266527176, -0.04553715139627457, -0.031879790127277374, -0.018222421407699585, -0.004565060138702393, 0.0090923011302948, 0.02274966426193714, 0.03640702739357948, 0.050064392387866974, 0.06372175365686417, 0.07737911492586136, 0.09103648364543915, 0.10469384491443634, 0.11835120618343353, 0.13200856745243073, 0.14566592872142792, 0.1593233048915863, 0.1729806661605835, 0.1866380274295807, 0.20029538869857788, 0.21395274996757507, 0.22761011123657227, 0.24126747250556946, 0.25492483377456665, 0.26858219504356384, 0.28223955631256104, 0.2958969175815582, 0.3095542788505554, 0.323211669921875, 0.3368690013885498, 0.350526362657547, 0.3641837239265442, 0.3778410851955414, 0.3914984464645386, 0.40515580773353577, 0.41881316900253296, 0.43247056007385254, 0.44612792134284973, 0.4597852826118469, 0.4734426438808441, 0.4871000051498413, 0.5007573962211609, 0.5144147276878357, 0.5280721187591553, 0.5417294502258301, 0.5553868412971497, 0.5690442323684692, 0.582701563835144, 0.5963589549064636, 0.6100162863731384, 0.623673677444458, 0.6373310089111328, 0.6509883999824524, 0.6646457314491272]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 5.0, 11.0, 19.0, 37.0, 47.0, 95.0, 131.0, 145.0, 145.0, 104.0, 93.0, 70.0, 34.0, 24.0, 17.0, 9.0, 6.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3931443691253662, -0.38505929708480835, -0.3769742250442505, -0.3688891530036926, -0.36080408096313477, -0.3527189791202545, -0.34463390707969666, -0.3365488350391388, -0.32846376299858093, -0.32037869095802307, -0.3122936189174652, -0.30420854687690735, -0.2961234450340271, -0.28803837299346924, -0.2799533009529114, -0.2718682289123535, -0.26378315687179565, -0.2556980848312378, -0.24761301279067993, -0.23952792584896088, -0.23144285380840302, -0.22335778176784515, -0.2152726948261261, -0.20718762278556824, -0.19910255074501038, -0.19101747870445251, -0.18293240666389465, -0.1748473197221756, -0.16676224768161774, -0.15867717564105988, -0.15059208869934082, -0.14250701665878296, -0.1344219446182251, -0.12633687257766724, -0.11825179308652878, -0.11016671359539032, -0.10208164155483246, -0.0939965695142746, -0.08591149002313614, -0.07782641053199768, -0.06974133849143982, -0.06165626272559166, -0.0535711869597435, -0.04548611119389534, -0.03740103542804718, -0.02931595966219902, -0.02123088389635086, -0.0131458081305027, -0.005060732364654541, 0.0030243434011936188, 0.011109419167041779, 0.01919449493288994, 0.027279570698738098, 0.03536464646458626, 0.04344972223043442, 0.05153479799628258, 0.05961987376213074, 0.0677049458026886, 0.07579002529382706, 0.08387510478496552, 0.09196017682552338, 0.10004524886608124, 0.1081303283572197, 0.11621540784835815, 0.12430047988891602]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 6.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 6.0, 8.0, 8.0, 8.0, 14.0, 14.0, 12.0, 25.0, 23.0, 16.0, 30.0, 43.0, 171.0, 1197.0, 4192174.0, 331.0, 44.0, 32.0, 14.0, 14.0, 20.0, 8.0, 10.0, 4.0, 10.0, 8.0, 10.0, 2.0, 0.0, 8.0, 0.0, 6.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.87109375, -1.814910888671875, -1.75872802734375, -1.702545166015625, -1.6463623046875, -1.590179443359375, -1.53399658203125, -1.477813720703125, -1.421630859375, -1.365447998046875, -1.30926513671875, -1.253082275390625, -1.1968994140625, -1.140716552734375, -1.08453369140625, -1.028350830078125, -0.97216796875, -0.915985107421875, -0.85980224609375, -0.803619384765625, -0.7474365234375, -0.691253662109375, -0.63507080078125, -0.578887939453125, -0.522705078125, -0.466522216796875, -0.41033935546875, -0.354156494140625, -0.2979736328125, -0.241790771484375, -0.18560791015625, -0.129425048828125, -0.0732421875, -0.017059326171875, 0.03912353515625, 0.095306396484375, 0.1514892578125, 0.207672119140625, 0.26385498046875, 0.320037841796875, 0.376220703125, 0.432403564453125, 0.48858642578125, 0.544769287109375, 0.6009521484375, 0.657135009765625, 0.71331787109375, 0.769500732421875, 0.82568359375, 0.881866455078125, 0.93804931640625, 0.994232177734375, 1.0504150390625, 1.106597900390625, 1.16278076171875, 1.218963623046875, 1.275146484375, 1.331329345703125, 1.38751220703125, 1.443695068359375, 1.4998779296875, 1.556060791015625, 1.61224365234375, 1.668426513671875, 1.724609375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 13.0, 24.0, 44.0, 128.0, 246.0, 280.0, 162.0, 58.0, 20.0, 10.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0], "bins": [-0.01215362548828125, -0.011924535036087036, -0.011695444583892822, -0.011466354131698608, -0.011237263679504395, -0.01100817322731018, -0.010779082775115967, -0.010549992322921753, -0.010320901870727539, -0.010091811418533325, -0.009862720966339111, -0.009633630514144897, -0.009404540061950684, -0.00917544960975647, -0.008946359157562256, -0.008717268705368042, -0.008488178253173828, -0.008259087800979614, -0.0080299973487854, -0.0078009068965911865, -0.007571816444396973, -0.007342725992202759, -0.007113635540008545, -0.006884545087814331, -0.006655454635620117, -0.006426364183425903, -0.0061972737312316895, -0.005968183279037476, -0.005739092826843262, -0.005510002374649048, -0.005280911922454834, -0.00505182147026062, -0.004822731018066406, -0.004593640565872192, -0.0043645501136779785, -0.004135459661483765, -0.003906369209289551, -0.003677278757095337, -0.003448188304901123, -0.003219097852706909, -0.0029900074005126953, -0.0027609169483184814, -0.0025318264961242676, -0.0023027360439300537, -0.00207364559173584, -0.001844555139541626, -0.0016154646873474121, -0.0013863742351531982, -0.0011572837829589844, -0.0009281933307647705, -0.0006991028785705566, -0.0004700124263763428, -0.0002409219741821289, -1.1831521987915039e-05, 0.00021725893020629883, 0.0004463493824005127, 0.0006754398345947266, 0.0009045302867889404, 0.0011336207389831543, 0.0013627111911773682, 0.001591801643371582, 0.001820892095565796, 0.0020499825477600098, 0.0022790729999542236, 0.0025081634521484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 6.0, 14.0, 16.0, 45.0, 150.0, 954.0, 4190879.0, 1984.0, 158.0, 46.0, 19.0, 7.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-1.7861328125, -1.7521743774414062, -1.7182159423828125, -1.6842575073242188, -1.650299072265625, -1.6163406372070312, -1.5823822021484375, -1.5484237670898438, -1.51446533203125, -1.4805068969726562, -1.4465484619140625, -1.4125900268554688, -1.378631591796875, -1.3446731567382812, -1.3107147216796875, -1.2767562866210938, -1.2427978515625, -1.2088394165039062, -1.1748809814453125, -1.1409225463867188, -1.106964111328125, -1.0730056762695312, -1.0390472412109375, -1.0050888061523438, -0.97113037109375, -0.9371719360351562, -0.9032135009765625, -0.8692550659179688, -0.835296630859375, -0.8013381958007812, -0.7673797607421875, -0.7334213256835938, -0.699462890625, -0.6655044555664062, -0.6315460205078125, -0.5975875854492188, -0.563629150390625, -0.5296707153320312, -0.4957122802734375, -0.46175384521484375, -0.42779541015625, -0.39383697509765625, -0.3598785400390625, -0.32592010498046875, -0.291961669921875, -0.25800323486328125, -0.2240447998046875, -0.19008636474609375, -0.1561279296875, -0.12216949462890625, -0.0882110595703125, -0.05425262451171875, -0.020294189453125, 0.01366424560546875, 0.0476226806640625, 0.08158111572265625, 0.11553955078125, 0.14949798583984375, 0.1834564208984375, 0.21741485595703125, 0.251373291015625, 0.28533172607421875, 0.3192901611328125, 0.35324859619140625, 0.38720703125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 12.0, 22.0, 24.0, 58.0, 131.0, 349.0, 2262.0, 786.0, 222.0, 88.0, 59.0, 28.0, 10.0, 9.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.02386474609375, -0.023343324661254883, -0.022821903228759766, -0.02230048179626465, -0.02177906036376953, -0.021257638931274414, -0.020736217498779297, -0.02021479606628418, -0.019693374633789062, -0.019171953201293945, -0.018650531768798828, -0.01812911033630371, -0.017607688903808594, -0.017086267471313477, -0.01656484603881836, -0.016043424606323242, -0.015522003173828125, -0.015000581741333008, -0.01447916030883789, -0.013957738876342773, -0.013436317443847656, -0.012914896011352539, -0.012393474578857422, -0.011872053146362305, -0.011350631713867188, -0.01082921028137207, -0.010307788848876953, -0.009786367416381836, -0.009264945983886719, -0.008743524551391602, -0.008222103118896484, -0.007700681686401367, -0.00717926025390625, -0.006657838821411133, -0.006136417388916016, -0.0056149959564208984, -0.005093574523925781, -0.004572153091430664, -0.004050731658935547, -0.0035293102264404297, -0.0030078887939453125, -0.0024864673614501953, -0.001965045928955078, -0.001443624496459961, -0.0009222030639648438, -0.00040078163146972656, 0.00012063980102539062, 0.0006420612335205078, 0.001163482666015625, 0.0016849040985107422, 0.0022063255310058594, 0.0027277469635009766, 0.0032491683959960938, 0.003770589828491211, 0.004292011260986328, 0.004813432693481445, 0.0053348541259765625, 0.00585627555847168, 0.006377696990966797, 0.006899118423461914, 0.007420539855957031, 0.007941961288452148, 0.008463382720947266, 0.008984804153442383, 0.0095062255859375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 29.0, 984.0, 8.0, 0.0, 2.0], "bins": [-4.319535255432129, -4.2478790283203125, -4.176222324371338, -4.1045660972595215, -4.032909393310547, -3.9612531661987305, -3.889596700668335, -3.8179402351379395, -3.746284008026123, -3.6746275424957275, -3.602971076965332, -3.5313148498535156, -3.45965838432312, -3.3880019187927246, -3.316345453262329, -3.2446889877319336, -3.173032522201538, -3.1013760566711426, -3.029719591140747, -2.9580633640289307, -2.886406898498535, -2.8147504329681396, -2.743093967437744, -2.6714375019073486, -2.599781036376953, -2.5281245708465576, -2.456468105316162, -2.3848118782043457, -2.31315541267395, -2.2414989471435547, -2.169842481613159, -2.0981860160827637, -2.0265297889709473, -1.9548733234405518, -1.8832169771194458, -1.8115605115890503, -1.7399041652679443, -1.6682476997375488, -1.5965912342071533, -1.5249347686767578, -1.4532783031463623, -1.3816218376159668, -1.3099654912948608, -1.2383090257644653, -1.1666526794433594, -1.0949962139129639, -1.0233397483825684, -0.9516833424568176, -0.8800269365310669, -0.8083705306053162, -0.7367141246795654, -0.6650576591491699, -0.5934012532234192, -0.5217448472976685, -0.45008841156959534, -0.3784319758415222, -0.30677559971809387, -0.23511917889118195, -0.16346275806427002, -0.0918063372373581, -0.020149916410446167, 0.051506489515304565, 0.12316292524337769, 0.1948193609714508, 0.26647576689720154]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 9.0, 11.0, 40.0, 112.0, 176.0, 280.0, 222.0, 100.0, 40.0, 19.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5005239844322205, -0.4905659258365631, -0.48060786724090576, -0.4706498384475708, -0.46069177985191345, -0.4507337212562561, -0.44077566266059875, -0.4308176040649414, -0.42085957527160645, -0.4109015166759491, -0.40094345808029175, -0.3909854292869568, -0.38102737069129944, -0.3710693120956421, -0.36111125349998474, -0.3511531949043274, -0.34119513630867004, -0.3312370777130127, -0.32127901911735535, -0.3113209903240204, -0.30136293172836304, -0.2914048731327057, -0.28144681453704834, -0.271488755941391, -0.26153069734573364, -0.2515726387500763, -0.24161459505558014, -0.2316565364599228, -0.22169849276542664, -0.2117404341697693, -0.20178237557411194, -0.1918243169784546, -0.18186628818511963, -0.17190822958946228, -0.16195018589496613, -0.15199212729930878, -0.14203408360481262, -0.13207602500915527, -0.12211796641349792, -0.11215991526842117, -0.10220186412334442, -0.09224381297826767, -0.08228576183319092, -0.07232770323753357, -0.06236965209245682, -0.052411600947380066, -0.042453546077013016, -0.032495491206645966, -0.022537440061569214, -0.012579387053847313, -0.002621334046125412, 0.007336718961596489, 0.01729477196931839, 0.02725282311439514, 0.03721087798476219, 0.04716893285512924, 0.057126984000205994, 0.06708503514528275, 0.0770430862903595, 0.08700114488601685, 0.0969591960310936, 0.10691724717617035, 0.1168753057718277, 0.12683334946632385, 0.1367914080619812]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 2.0, 4.0, 9.0, 6.0, 6.0, 10.0, 8.0, 7.0, 10.0, 18.0, 25.0, 12.0, 18.0, 29.0, 27.0, 36.0, 45.0, 49.0, 48.0, 33.0, 112.0, 1008894.0, 38679.0, 65.0, 43.0, 44.0, 43.0, 32.0, 28.0, 30.0, 31.0, 25.0, 22.0, 17.0, 11.0, 17.0, 7.0, 6.0, 13.0, 6.0, 6.0, 6.0, 3.0, 3.0, 0.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.59619140625, -0.5768661499023438, -0.5575408935546875, -0.5382156372070312, -0.518890380859375, -0.49956512451171875, -0.4802398681640625, -0.46091461181640625, -0.44158935546875, -0.42226409912109375, -0.4029388427734375, -0.38361358642578125, -0.364288330078125, -0.34496307373046875, -0.3256378173828125, -0.30631256103515625, -0.2869873046875, -0.26766204833984375, -0.2483367919921875, -0.22901153564453125, -0.209686279296875, -0.19036102294921875, -0.1710357666015625, -0.15171051025390625, -0.13238525390625, -0.11305999755859375, -0.0937347412109375, -0.07440948486328125, -0.055084228515625, -0.03575897216796875, -0.0164337158203125, 0.00289154052734375, 0.022216796875, 0.04154205322265625, 0.0608673095703125, 0.08019256591796875, 0.099517822265625, 0.11884307861328125, 0.1381683349609375, 0.15749359130859375, 0.17681884765625, 0.19614410400390625, 0.2154693603515625, 0.23479461669921875, 0.254119873046875, 0.27344512939453125, 0.2927703857421875, 0.31209564208984375, 0.3314208984375, 0.35074615478515625, 0.3700714111328125, 0.38939666748046875, 0.408721923828125, 0.42804718017578125, 0.4473724365234375, 0.46669769287109375, 0.48602294921875, 0.5053482055664062, 0.5246734619140625, 0.5439987182617188, 0.563323974609375, 0.5826492309570312, 0.6019744873046875, 0.6212997436523438, 0.640625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 100.0, 640.0, 263.0, 12.0, 1.0, 1.0], "bins": [-0.131103515625, -0.1289052963256836, -0.1267070770263672, -0.12450885772705078, -0.12231063842773438, -0.12011241912841797, -0.11791419982910156, -0.11571598052978516, -0.11351776123046875, -0.11131954193115234, -0.10912132263183594, -0.10692310333251953, -0.10472488403320312, -0.10252666473388672, -0.10032844543457031, -0.0981302261352539, -0.0959320068359375, -0.0937337875366211, -0.09153556823730469, -0.08933734893798828, -0.08713912963867188, -0.08494091033935547, -0.08274269104003906, -0.08054447174072266, -0.07834625244140625, -0.07614803314208984, -0.07394981384277344, -0.07175159454345703, -0.06955337524414062, -0.06735515594482422, -0.06515693664550781, -0.0629587173461914, -0.060760498046875, -0.058562278747558594, -0.05636405944824219, -0.05416584014892578, -0.051967620849609375, -0.04976940155029297, -0.04757118225097656, -0.045372962951660156, -0.04317474365234375, -0.040976524353027344, -0.03877830505371094, -0.03658008575439453, -0.034381866455078125, -0.03218364715576172, -0.029985427856445312, -0.027787208557128906, -0.0255889892578125, -0.023390769958496094, -0.021192550659179688, -0.01899433135986328, -0.016796112060546875, -0.014597892761230469, -0.012399673461914062, -0.010201454162597656, -0.00800323486328125, -0.005805015563964844, -0.0036067962646484375, -0.0014085769653320312, 0.000789642333984375, 0.0029878616333007812, 0.0051860809326171875, 0.007384300231933594, 0.00958251953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 4.0, 4.0, 16.0, 9.0, 12.0, 11.0, 15.0, 26.0, 56.0, 52.0, 94.0, 132.0, 273.0, 616.0, 1761.0, 8009.0, 66666.0, 828094.0, 126623.0, 12071.0, 2440.0, 749.0, 301.0, 174.0, 109.0, 61.0, 43.0, 28.0, 34.0, 14.0, 16.0, 7.0, 6.0, 5.0, 7.0, 6.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.21826171875, -0.2108917236328125, -0.203521728515625, -0.1961517333984375, -0.18878173828125, -0.1814117431640625, -0.174041748046875, -0.1666717529296875, -0.1593017578125, -0.1519317626953125, -0.144561767578125, -0.1371917724609375, -0.12982177734375, -0.1224517822265625, -0.115081787109375, -0.1077117919921875, -0.100341796875, -0.0929718017578125, -0.085601806640625, -0.0782318115234375, -0.07086181640625, -0.0634918212890625, -0.056121826171875, -0.0487518310546875, -0.0413818359375, -0.0340118408203125, -0.026641845703125, -0.0192718505859375, -0.01190185546875, -0.0045318603515625, 0.002838134765625, 0.0102081298828125, 0.017578125, 0.0249481201171875, 0.032318115234375, 0.0396881103515625, 0.04705810546875, 0.0544281005859375, 0.061798095703125, 0.0691680908203125, 0.0765380859375, 0.0839080810546875, 0.091278076171875, 0.0986480712890625, 0.10601806640625, 0.1133880615234375, 0.120758056640625, 0.1281280517578125, 0.135498046875, 0.1428680419921875, 0.150238037109375, 0.1576080322265625, 0.16497802734375, 0.1723480224609375, 0.179718017578125, 0.1870880126953125, 0.1944580078125, 0.2018280029296875, 0.209197998046875, 0.2165679931640625, 0.22393798828125, 0.2313079833984375, 0.238677978515625, 0.2460479736328125, 0.25341796875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 7.0, 8.0, 5.0, 7.0, 13.0, 13.0, 22.0, 13.0, 24.0, 33.0, 35.0, 47.0, 49.0, 74.0, 54.0, 69.0, 69.0, 85.0, 64.0, 58.0, 55.0, 42.0, 36.0, 24.0, 32.0, 16.0, 14.0, 12.0, 6.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0933837890625, -0.09018611907958984, -0.08698844909667969, -0.08379077911376953, -0.08059310913085938, -0.07739543914794922, -0.07419776916503906, -0.0710000991821289, -0.06780242919921875, -0.0646047592163086, -0.06140708923339844, -0.05820941925048828, -0.055011749267578125, -0.05181407928466797, -0.04861640930175781, -0.045418739318847656, -0.0422210693359375, -0.039023399353027344, -0.03582572937011719, -0.03262805938720703, -0.029430389404296875, -0.02623271942138672, -0.023035049438476562, -0.019837379455566406, -0.01663970947265625, -0.013442039489746094, -0.010244369506835938, -0.007046699523925781, -0.003849029541015625, -0.0006513595581054688, 0.0025463104248046875, 0.005743980407714844, 0.008941650390625, 0.012139320373535156, 0.015336990356445312, 0.01853466033935547, 0.021732330322265625, 0.02493000030517578, 0.028127670288085938, 0.031325340270996094, 0.03452301025390625, 0.037720680236816406, 0.04091835021972656, 0.04411602020263672, 0.047313690185546875, 0.05051136016845703, 0.05370903015136719, 0.056906700134277344, 0.0601043701171875, 0.06330204010009766, 0.06649971008300781, 0.06969738006591797, 0.07289505004882812, 0.07609272003173828, 0.07929039001464844, 0.0824880599975586, 0.08568572998046875, 0.0888833999633789, 0.09208106994628906, 0.09527873992919922, 0.09847640991210938, 0.10167407989501953, 0.10487174987792969, 0.10806941986083984, 0.11126708984375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 6.0, 8.0, 8.0, 14.0, 19.0, 22.0, 43.0, 54.0, 104.0, 235.0, 499.0, 1327.0, 4524.0, 89877.0, 939701.0, 8738.0, 2026.0, 705.0, 300.0, 122.0, 63.0, 46.0, 20.0, 15.0, 16.0, 7.0, 3.0, 7.0, 7.0, 5.0, 4.0, 5.0, 1.0, 3.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64306640625, -0.6242523193359375, -0.605438232421875, -0.5866241455078125, -0.56781005859375, -0.5489959716796875, -0.530181884765625, -0.5113677978515625, -0.4925537109375, -0.4737396240234375, -0.454925537109375, -0.4361114501953125, -0.41729736328125, -0.3984832763671875, -0.379669189453125, -0.3608551025390625, -0.342041015625, -0.3232269287109375, -0.304412841796875, -0.2855987548828125, -0.26678466796875, -0.2479705810546875, -0.229156494140625, -0.2103424072265625, -0.1915283203125, -0.1727142333984375, -0.153900146484375, -0.1350860595703125, -0.11627197265625, -0.0974578857421875, -0.078643798828125, -0.0598297119140625, -0.041015625, -0.0222015380859375, -0.003387451171875, 0.0154266357421875, 0.03424072265625, 0.0530548095703125, 0.071868896484375, 0.0906829833984375, 0.1094970703125, 0.1283111572265625, 0.147125244140625, 0.1659393310546875, 0.18475341796875, 0.2035675048828125, 0.222381591796875, 0.2411956787109375, 0.260009765625, 0.2788238525390625, 0.297637939453125, 0.3164520263671875, 0.33526611328125, 0.3540802001953125, 0.372894287109375, 0.3917083740234375, 0.4105224609375, 0.4293365478515625, 0.448150634765625, 0.4669647216796875, 0.48577880859375, 0.5045928955078125, 0.523406982421875, 0.5422210693359375, 0.56103515625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 5.0, 13.0, 21.0, 53.0, 129.0, 378.0, 222.0, 84.0, 46.0, 12.0, 10.0, 3.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.778406143188477e-05, -7.54818320274353e-05, -7.317960262298584e-05, -7.087737321853638e-05, -6.857514381408691e-05, -6.627291440963745e-05, -6.397068500518799e-05, -6.166845560073853e-05, -5.936622619628906e-05, -5.70639967918396e-05, -5.476176738739014e-05, -5.2459537982940674e-05, -5.015730857849121e-05, -4.785507917404175e-05, -4.5552849769592285e-05, -4.325062036514282e-05, -4.094839096069336e-05, -3.8646161556243896e-05, -3.6343932151794434e-05, -3.404170274734497e-05, -3.173947334289551e-05, -2.9437243938446045e-05, -2.7135014533996582e-05, -2.483278512954712e-05, -2.2530555725097656e-05, -2.0228326320648193e-05, -1.792609691619873e-05, -1.5623867511749268e-05, -1.3321638107299805e-05, -1.1019408702850342e-05, -8.717179298400879e-06, -6.414949893951416e-06, -4.112720489501953e-06, -1.8104910850524902e-06, 4.917383193969727e-07, 2.7939677238464355e-06, 5.0961971282958984e-06, 7.398426532745361e-06, 9.700655937194824e-06, 1.2002885341644287e-05, 1.430511474609375e-05, 1.6607344150543213e-05, 1.8909573554992676e-05, 2.121180295944214e-05, 2.35140323638916e-05, 2.5816261768341064e-05, 2.8118491172790527e-05, 3.042072057723999e-05, 3.272294998168945e-05, 3.5025179386138916e-05, 3.732740879058838e-05, 3.962963819503784e-05, 4.1931867599487305e-05, 4.423409700393677e-05, 4.653632640838623e-05, 4.883855581283569e-05, 5.1140785217285156e-05, 5.344301462173462e-05, 5.574524402618408e-05, 5.8047473430633545e-05, 6.034970283508301e-05, 6.265193223953247e-05, 6.495416164398193e-05, 6.72563910484314e-05, 6.955862045288086e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 1.0, 4.0, 8.0, 13.0, 15.0, 24.0, 45.0, 64.0, 127.0, 225.0, 375.0, 703.0, 1347.0, 2793.0, 7239.0, 169134.0, 851375.0, 8652.0, 3056.0, 1470.0, 815.0, 426.0, 231.0, 149.0, 101.0, 56.0, 31.0, 15.0, 13.0, 16.0, 4.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.91796875, -0.88134765625, -0.8447265625, -0.80810546875, -0.771484375, -0.73486328125, -0.6982421875, -0.66162109375, -0.625, -0.58837890625, -0.5517578125, -0.51513671875, -0.478515625, -0.44189453125, -0.4052734375, -0.36865234375, -0.33203125, -0.29541015625, -0.2587890625, -0.22216796875, -0.185546875, -0.14892578125, -0.1123046875, -0.07568359375, -0.0390625, -0.00244140625, 0.0341796875, 0.07080078125, 0.107421875, 0.14404296875, 0.1806640625, 0.21728515625, 0.25390625, 0.29052734375, 0.3271484375, 0.36376953125, 0.400390625, 0.43701171875, 0.4736328125, 0.51025390625, 0.546875, 0.58349609375, 0.6201171875, 0.65673828125, 0.693359375, 0.72998046875, 0.7666015625, 0.80322265625, 0.83984375, 0.87646484375, 0.9130859375, 0.94970703125, 0.986328125, 1.02294921875, 1.0595703125, 1.09619140625, 1.1328125, 1.16943359375, 1.2060546875, 1.24267578125, 1.279296875, 1.31591796875, 1.3525390625, 1.38916015625, 1.42578125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 12.0, 49.0, 171.0, 504.0, 158.0, 44.0, 9.0, 6.0, 8.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.291259765625, -0.28025054931640625, -0.2692413330078125, -0.25823211669921875, -0.247222900390625, -0.23621368408203125, -0.2252044677734375, -0.21419525146484375, -0.20318603515625, -0.19217681884765625, -0.1811676025390625, -0.17015838623046875, -0.159149169921875, -0.14813995361328125, -0.1371307373046875, -0.12612152099609375, -0.1151123046875, -0.10410308837890625, -0.0930938720703125, -0.08208465576171875, -0.071075439453125, -0.06006622314453125, -0.0490570068359375, -0.03804779052734375, -0.02703857421875, -0.01602935791015625, -0.0050201416015625, 0.00598907470703125, 0.016998291015625, 0.02800750732421875, 0.0390167236328125, 0.05002593994140625, 0.06103515625, 0.07204437255859375, 0.0830535888671875, 0.09406280517578125, 0.105072021484375, 0.11608123779296875, 0.1270904541015625, 0.13809967041015625, 0.14910888671875, 0.16011810302734375, 0.1711273193359375, 0.18213653564453125, 0.193145751953125, 0.20415496826171875, 0.2151641845703125, 0.22617340087890625, 0.2371826171875, 0.24819183349609375, 0.2592010498046875, 0.27021026611328125, 0.281219482421875, 0.29222869873046875, 0.3032379150390625, 0.31424713134765625, 0.32525634765625, 0.33626556396484375, 0.3472747802734375, 0.35828399658203125, 0.369293212890625, 0.38030242919921875, 0.3913116455078125, 0.40232086181640625, 0.413330078125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 30.0, 695.0, 267.0, 16.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.98137378692627, -10.730554580688477, -10.479735374450684, -10.22891616821289, -9.978097915649414, -9.727278709411621, -9.476459503173828, -9.225640296936035, -8.974821090698242, -8.72400188446045, -8.473182678222656, -8.222363471984863, -7.9715447425842285, -7.7207255363464355, -7.469906806945801, -7.219087600708008, -6.968268394470215, -6.717449188232422, -6.466629981994629, -6.215811252593994, -5.964992046356201, -5.714172840118408, -5.463354110717773, -5.2125349044799805, -4.9617156982421875, -4.7108964920043945, -4.460077285766602, -4.209258556365967, -3.958439350128174, -3.707620143890381, -3.456801176071167, -3.205982208251953, -2.9551639556884766, -2.7043447494506836, -2.4535257816314697, -2.202706813812256, -1.951887607574463, -1.7010685205459595, -1.450249433517456, -1.1994303464889526, -0.9486112594604492, -0.6977921724319458, -0.4469730854034424, -0.19615399837493896, 0.05466508865356445, 0.30548417568206787, 0.5563032627105713, 0.8071223497390747, 1.0579414367675781, 1.3087605237960815, 1.559579610824585, 1.8103986978530884, 2.061217784881592, 2.3120369911193848, 2.5628559589385986, 2.8136749267578125, 3.0644941329956055, 3.3153133392333984, 3.5661323070526123, 3.816951274871826, 4.067770481109619, 4.318589687347412, 4.569408416748047, 4.82022762298584, 5.071046829223633]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 12.0, 17.0, 38.0, 62.0, 66.0, 110.0, 113.0, 130.0, 107.0, 107.0, 92.0, 58.0, 41.0, 28.0, 5.0, 10.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.338090419769287, -2.2934646606445312, -2.2488386631011963, -2.2042129039764404, -2.1595871448516846, -2.1149611473083496, -2.0703353881835938, -2.025709629058838, -1.9810837507247925, -1.936457872390747, -1.8918321132659912, -1.8472062349319458, -1.8025803565979004, -1.7579545974731445, -1.7133287191390991, -1.6687028408050537, -1.6240770816802979, -1.5794512033462524, -1.5348254442214966, -1.4901995658874512, -1.4455738067626953, -1.40094792842865, -1.3563220500946045, -1.3116962909698486, -1.2670704126358032, -1.2224445343017578, -1.177818775177002, -1.1331928968429565, -1.0885670185089111, -1.0439412593841553, -0.9993153810501099, -0.9546895623207092, -0.9100638031959534, -0.8654379844665527, -0.8208121061325073, -0.7761862874031067, -0.731560468673706, -0.6869346499443054, -0.6423088312149048, -0.5976829528808594, -0.5530571341514587, -0.5084313154220581, -0.4638054668903351, -0.41917961835861206, -0.3745537996292114, -0.3299279808998108, -0.28530213236808777, -0.24067628383636475, -0.1960504651069641, -0.15142463147640228, -0.10679879784584045, -0.062172964215278625, -0.017547130584716797, 0.027078703045845032, 0.07170453667640686, 0.11633038520812988, 0.16095620393753052, 0.20558203756809235, 0.2502078711986542, 0.2948337197303772, 0.33945953845977783, 0.38408535718917847, 0.4287112057209015, 0.4733370542526245, 0.5179628729820251]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 7.0, 14.0, 17.0, 16.0, 17.0, 28.0, 31.0, 34.0, 52.0, 58.0, 88.0, 345.0, 57777.0, 4135214.0, 500.0, 68.0, 14.0, 1.0, 2.0], "bins": [-4.640625, -4.560752868652344, -4.4808807373046875, -4.401008605957031, -4.321136474609375, -4.241264343261719, -4.1613922119140625, -4.081520080566406, -4.00164794921875, -3.9217758178710938, -3.8419036865234375, -3.7620315551757812, -3.682159423828125, -3.6022872924804688, -3.5224151611328125, -3.4425430297851562, -3.3626708984375, -3.2827987670898438, -3.2029266357421875, -3.1230545043945312, -3.043182373046875, -2.9633102416992188, -2.8834381103515625, -2.8035659790039062, -2.72369384765625, -2.6438217163085938, -2.5639495849609375, -2.4840774536132812, -2.404205322265625, -2.3243331909179688, -2.2444610595703125, -2.1645889282226562, -2.084716796875, -2.0048446655273438, -1.9249725341796875, -1.8451004028320312, -1.765228271484375, -1.6853561401367188, -1.6054840087890625, -1.5256118774414062, -1.44573974609375, -1.3658676147460938, -1.2859954833984375, -1.2061233520507812, -1.126251220703125, -1.0463790893554688, -0.9665069580078125, -0.8866348266601562, -0.8067626953125, -0.7268905639648438, -0.6470184326171875, -0.5671463012695312, -0.487274169921875, -0.40740203857421875, -0.3275299072265625, -0.24765777587890625, -0.16778564453125, -0.08791351318359375, -0.0080413818359375, 0.07183074951171875, 0.151702880859375, 0.23157501220703125, 0.3114471435546875, 0.39131927490234375, 0.47119140625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 18.0, 66.0, 223.0, 370.0, 233.0, 91.0, 12.0, 4.0, 1.0], "bins": [-0.15185546875, -0.14925944805145264, -0.14666342735290527, -0.1440674066543579, -0.14147138595581055, -0.13887536525726318, -0.13627934455871582, -0.13368332386016846, -0.1310873031616211, -0.12849128246307373, -0.12589526176452637, -0.123299241065979, -0.12070322036743164, -0.11810719966888428, -0.11551117897033691, -0.11291515827178955, -0.11031913757324219, -0.10772311687469482, -0.10512709617614746, -0.1025310754776001, -0.09993505477905273, -0.09733903408050537, -0.09474301338195801, -0.09214699268341064, -0.08955097198486328, -0.08695495128631592, -0.08435893058776855, -0.08176290988922119, -0.07916688919067383, -0.07657086849212646, -0.0739748477935791, -0.07137882709503174, -0.06878280639648438, -0.06618678569793701, -0.06359076499938965, -0.060994744300842285, -0.05839872360229492, -0.05580270290374756, -0.053206682205200195, -0.05061066150665283, -0.04801464080810547, -0.045418620109558105, -0.04282259941101074, -0.04022657871246338, -0.037630558013916016, -0.03503453731536865, -0.03243851661682129, -0.029842495918273926, -0.027246475219726562, -0.0246504545211792, -0.022054433822631836, -0.019458413124084473, -0.01686239242553711, -0.014266371726989746, -0.011670351028442383, -0.00907433032989502, -0.006478309631347656, -0.003882288932800293, -0.0012862682342529297, 0.0013097524642944336, 0.003905773162841797, 0.00650179386138916, 0.009097814559936523, 0.011693835258483887, 0.01428985595703125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 9.0, 8.0, 8.0, 11.0, 10.0, 24.0, 26.0, 30.0, 58.0, 52.0, 71.0, 111.0, 224.0, 1246.0, 4177165.0, 14335.0, 454.0, 148.0, 78.0, 62.0, 41.0, 36.0, 14.0, 19.0, 18.0, 11.0, 9.0, 2.0, 4.0, 5.0, 2.0], "bins": [-6.1875, -6.057861328125, -5.92822265625, -5.798583984375, -5.6689453125, -5.539306640625, -5.40966796875, -5.280029296875, -5.150390625, -5.020751953125, -4.89111328125, -4.761474609375, -4.6318359375, -4.502197265625, -4.37255859375, -4.242919921875, -4.11328125, -3.983642578125, -3.85400390625, -3.724365234375, -3.5947265625, -3.465087890625, -3.33544921875, -3.205810546875, -3.076171875, -2.946533203125, -2.81689453125, -2.687255859375, -2.5576171875, -2.427978515625, -2.29833984375, -2.168701171875, -2.0390625, -1.909423828125, -1.77978515625, -1.650146484375, -1.5205078125, -1.390869140625, -1.26123046875, -1.131591796875, -1.001953125, -0.872314453125, -0.74267578125, -0.613037109375, -0.4833984375, -0.353759765625, -0.22412109375, -0.094482421875, 0.03515625, 0.164794921875, 0.29443359375, 0.424072265625, 0.5537109375, 0.683349609375, 0.81298828125, 0.942626953125, 1.072265625, 1.201904296875, 1.33154296875, 1.461181640625, 1.5908203125, 1.720458984375, 1.85009765625, 1.979736328125, 2.109375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 53.0, 3688.0, 272.0, 52.0, 11.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76904296875, -0.754180908203125, -0.73931884765625, -0.724456787109375, -0.7095947265625, -0.694732666015625, -0.67987060546875, -0.665008544921875, -0.650146484375, -0.635284423828125, -0.62042236328125, -0.605560302734375, -0.5906982421875, -0.575836181640625, -0.56097412109375, -0.546112060546875, -0.53125, -0.516387939453125, -0.50152587890625, -0.486663818359375, -0.4718017578125, -0.456939697265625, -0.44207763671875, -0.427215576171875, -0.412353515625, -0.397491455078125, -0.38262939453125, -0.367767333984375, -0.3529052734375, -0.338043212890625, -0.32318115234375, -0.308319091796875, -0.29345703125, -0.278594970703125, -0.26373291015625, -0.248870849609375, -0.2340087890625, -0.219146728515625, -0.20428466796875, -0.189422607421875, -0.174560546875, -0.159698486328125, -0.14483642578125, -0.129974365234375, -0.1151123046875, -0.100250244140625, -0.08538818359375, -0.070526123046875, -0.0556640625, -0.040802001953125, -0.02593994140625, -0.011077880859375, 0.0037841796875, 0.018646240234375, 0.03350830078125, 0.048370361328125, 0.063232421875, 0.078094482421875, 0.09295654296875, 0.107818603515625, 0.1226806640625, 0.137542724609375, 0.15240478515625, 0.167266845703125, 0.18212890625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 13.0, 25.0, 78.0, 242.0, 470.0, 118.0, 33.0, 15.0, 7.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.533083438873291, -3.4473352432250977, -3.3615870475769043, -3.275838851928711, -3.1900906562805176, -3.104342222213745, -3.0185940265655518, -2.9328458309173584, -2.847097635269165, -2.7613494396209717, -2.6756012439727783, -2.589853048324585, -2.5041046142578125, -2.418356418609619, -2.332608222961426, -2.2468600273132324, -2.161111831665039, -2.0753636360168457, -1.9896154403686523, -1.9038671255111694, -1.818118929862976, -1.7323707342147827, -1.6466224193572998, -1.5608742237091064, -1.475126028060913, -1.3893778324127197, -1.3036296367645264, -1.2178813219070435, -1.13213312625885, -1.0463849306106567, -0.9606366753578186, -0.8748884201049805, -0.789139986038208, -0.7033917903900146, -0.6176435351371765, -0.5318952798843384, -0.446147084236145, -0.3603988587856293, -0.2746506333351135, -0.1889023780822754, -0.10315418243408203, -0.017405956983566284, 0.06834226846694946, 0.1540904939174652, 0.23983871936798096, 0.3255869448184967, 0.41133517026901245, 0.4970834255218506, 0.582831621170044, 0.6685798168182373, 0.7543280720710754, 0.8400763273239136, 0.9258245229721069, 1.0115727186203003, 1.0973210334777832, 1.1830692291259766, 1.26881742477417, 1.3545656204223633, 1.4403138160705566, 1.5260621309280396, 1.611810326576233, 1.6975585222244263, 1.7833068370819092, 1.8690550327301025, 1.954803228378296]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 12.0, 26.0, 40.0, 60.0, 96.0, 130.0, 121.0, 132.0, 117.0, 110.0, 61.0, 43.0, 23.0, 14.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.7648248672485352, -1.714139699935913, -1.6634546518325806, -1.6127694845199585, -1.5620843172073364, -1.511399269104004, -1.4607141017913818, -1.4100289344787598, -1.3593437671661377, -1.3086585998535156, -1.257973551750183, -1.207288384437561, -1.156603217124939, -1.1059181690216064, -1.0552330017089844, -1.0045478343963623, -0.9538627862930298, -0.9031776785850525, -0.8524925112724304, -0.8018074035644531, -0.751122236251831, -0.7004371285438538, -0.6497520208358765, -0.5990668535232544, -0.5483817458152771, -0.4976966083049774, -0.44701147079467773, -0.39632636308670044, -0.34564122557640076, -0.2949560880661011, -0.24427098035812378, -0.1935858428478241, -0.14290082454681396, -0.09221569448709488, -0.04153056442737579, 0.009154558181762695, 0.05983969569206238, 0.11052483320236206, 0.16120994091033936, 0.21189507842063904, 0.2625802159309387, 0.3132653534412384, 0.3639504909515381, 0.4146355986595154, 0.46532073616981506, 0.5160058736801147, 0.566690981388092, 0.6173760890960693, 0.6680612564086914, 0.7187463641166687, 0.7694315314292908, 0.8201166391372681, 0.8708018064498901, 0.9214869141578674, 0.9721720218658447, 1.0228571891784668, 1.0735423564910889, 1.124227523803711, 1.1749125719070435, 1.2255977392196655, 1.2762829065322876, 1.3269679546356201, 1.3776531219482422, 1.4283382892608643, 1.4790233373641968]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 5.0, 1.0, 1.0, 3.0, 2.0, 6.0, 13.0, 9.0, 15.0, 8.0, 20.0, 21.0, 28.0, 31.0, 42.0, 65.0, 155.0, 352.0, 1049.0, 5165.0, 60779.0, 910734.0, 63057.0, 5136.0, 1110.0, 344.0, 146.0, 82.0, 41.0, 38.0, 20.0, 17.0, 17.0, 14.0, 5.0, 5.0, 10.0, 2.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.96337890625, -0.9346237182617188, -0.9058685302734375, -0.8771133422851562, -0.848358154296875, -0.8196029663085938, -0.7908477783203125, -0.7620925903320312, -0.73333740234375, -0.7045822143554688, -0.6758270263671875, -0.6470718383789062, -0.618316650390625, -0.5895614624023438, -0.5608062744140625, -0.5320510864257812, -0.5032958984375, -0.47454071044921875, -0.4457855224609375, -0.41703033447265625, -0.388275146484375, -0.35951995849609375, -0.3307647705078125, -0.30200958251953125, -0.27325439453125, -0.24449920654296875, -0.2157440185546875, -0.18698883056640625, -0.158233642578125, -0.12947845458984375, -0.1007232666015625, -0.07196807861328125, -0.043212890625, -0.01445770263671875, 0.0142974853515625, 0.04305267333984375, 0.071807861328125, 0.10056304931640625, 0.1293182373046875, 0.15807342529296875, 0.18682861328125, 0.21558380126953125, 0.2443389892578125, 0.27309417724609375, 0.301849365234375, 0.33060455322265625, 0.3593597412109375, 0.38811492919921875, 0.4168701171875, 0.44562530517578125, 0.4743804931640625, 0.5031356811523438, 0.531890869140625, 0.5606460571289062, 0.5894012451171875, 0.6181564331054688, 0.64691162109375, 0.6756668090820312, 0.7044219970703125, 0.7331771850585938, 0.761932373046875, 0.7906875610351562, 0.8194427490234375, 0.8481979370117188, 0.876953125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 11.0, 20.0, 53.0, 84.0, 117.0, 168.0, 179.0, 153.0, 101.0, 62.0, 31.0, 9.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.1876220703125, -0.18395423889160156, -0.18028640747070312, -0.1766185760498047, -0.17295074462890625, -0.1692829132080078, -0.16561508178710938, -0.16194725036621094, -0.1582794189453125, -0.15461158752441406, -0.15094375610351562, -0.1472759246826172, -0.14360809326171875, -0.1399402618408203, -0.13627243041992188, -0.13260459899902344, -0.128936767578125, -0.12526893615722656, -0.12160110473632812, -0.11793327331542969, -0.11426544189453125, -0.11059761047363281, -0.10692977905273438, -0.10326194763183594, -0.0995941162109375, -0.09592628479003906, -0.09225845336914062, -0.08859062194824219, -0.08492279052734375, -0.08125495910644531, -0.07758712768554688, -0.07391929626464844, -0.07025146484375, -0.06658363342285156, -0.06291580200195312, -0.05924797058105469, -0.05558013916015625, -0.05191230773925781, -0.048244476318359375, -0.04457664489746094, -0.0409088134765625, -0.03724098205566406, -0.033573150634765625, -0.029905319213867188, -0.02623748779296875, -0.022569656372070312, -0.018901824951171875, -0.015233993530273438, -0.011566162109375, -0.007898330688476562, -0.004230499267578125, -0.0005626678466796875, 0.00310516357421875, 0.0067729949951171875, 0.010440826416015625, 0.014108657836914062, 0.0177764892578125, 0.021444320678710938, 0.025112152099609375, 0.028779983520507812, 0.03244781494140625, 0.03611564636230469, 0.039783477783203125, 0.04345130920410156, 0.047119140625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 9.0, 4.0, 6.0, 14.0, 17.0, 22.0, 26.0, 54.0, 47.0, 69.0, 147.0, 270.0, 577.0, 1504.0, 6648.0, 58451.0, 820164.0, 144796.0, 11951.0, 2286.0, 676.0, 319.0, 173.0, 101.0, 73.0, 42.0, 38.0, 25.0, 12.0, 10.0, 8.0, 5.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5546875, -0.5391311645507812, -0.5235748291015625, -0.5080184936523438, -0.492462158203125, -0.47690582275390625, -0.4613494873046875, -0.44579315185546875, -0.43023681640625, -0.41468048095703125, -0.3991241455078125, -0.38356781005859375, -0.368011474609375, -0.35245513916015625, -0.3368988037109375, -0.32134246826171875, -0.3057861328125, -0.29022979736328125, -0.2746734619140625, -0.25911712646484375, -0.243560791015625, -0.22800445556640625, -0.2124481201171875, -0.19689178466796875, -0.18133544921875, -0.16577911376953125, -0.1502227783203125, -0.13466644287109375, -0.119110107421875, -0.10355377197265625, -0.0879974365234375, -0.07244110107421875, -0.056884765625, -0.04132843017578125, -0.0257720947265625, -0.01021575927734375, 0.005340576171875, 0.02089691162109375, 0.0364532470703125, 0.05200958251953125, 0.06756591796875, 0.08312225341796875, 0.0986785888671875, 0.11423492431640625, 0.129791259765625, 0.14534759521484375, 0.1609039306640625, 0.17646026611328125, 0.1920166015625, 0.20757293701171875, 0.2231292724609375, 0.23868560791015625, 0.254241943359375, 0.26979827880859375, 0.2853546142578125, 0.30091094970703125, 0.31646728515625, 0.33202362060546875, 0.3475799560546875, 0.36313629150390625, 0.378692626953125, 0.39424896240234375, 0.4098052978515625, 0.42536163330078125, 0.44091796875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 8.0, 6.0, 6.0, 15.0, 15.0, 18.0, 20.0, 26.0, 20.0, 20.0, 36.0, 61.0, 51.0, 51.0, 64.0, 72.0, 53.0, 67.0, 63.0, 50.0, 47.0, 38.0, 29.0, 39.0, 26.0, 22.0, 27.0, 19.0, 11.0, 5.0, 7.0, 8.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22265625, -0.21600341796875, -0.2093505859375, -0.20269775390625, -0.196044921875, -0.18939208984375, -0.1827392578125, -0.17608642578125, -0.16943359375, -0.16278076171875, -0.1561279296875, -0.14947509765625, -0.142822265625, -0.13616943359375, -0.1295166015625, -0.12286376953125, -0.1162109375, -0.10955810546875, -0.1029052734375, -0.09625244140625, -0.089599609375, -0.08294677734375, -0.0762939453125, -0.06964111328125, -0.06298828125, -0.05633544921875, -0.0496826171875, -0.04302978515625, -0.036376953125, -0.02972412109375, -0.0230712890625, -0.01641845703125, -0.009765625, -0.00311279296875, 0.0035400390625, 0.01019287109375, 0.016845703125, 0.02349853515625, 0.0301513671875, 0.03680419921875, 0.04345703125, 0.05010986328125, 0.0567626953125, 0.06341552734375, 0.070068359375, 0.07672119140625, 0.0833740234375, 0.09002685546875, 0.0966796875, 0.10333251953125, 0.1099853515625, 0.11663818359375, 0.123291015625, 0.12994384765625, 0.1365966796875, 0.14324951171875, 0.14990234375, 0.15655517578125, 0.1632080078125, 0.16986083984375, 0.176513671875, 0.18316650390625, 0.1898193359375, 0.19647216796875, 0.203125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 8.0, 12.0, 10.0, 21.0, 17.0, 27.0, 52.0, 120.0, 244.0, 609.0, 2070.0, 10720.0, 138886.0, 853403.0, 35743.0, 4693.0, 1107.0, 392.0, 161.0, 97.0, 53.0, 39.0, 23.0, 14.0, 11.0, 5.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.345703125, -0.334991455078125, -0.32427978515625, -0.313568115234375, -0.3028564453125, -0.292144775390625, -0.28143310546875, -0.270721435546875, -0.260009765625, -0.249298095703125, -0.23858642578125, -0.227874755859375, -0.2171630859375, -0.206451416015625, -0.19573974609375, -0.185028076171875, -0.17431640625, -0.163604736328125, -0.15289306640625, -0.142181396484375, -0.1314697265625, -0.120758056640625, -0.11004638671875, -0.099334716796875, -0.088623046875, -0.077911376953125, -0.06719970703125, -0.056488037109375, -0.0457763671875, -0.035064697265625, -0.02435302734375, -0.013641357421875, -0.0029296875, 0.007781982421875, 0.01849365234375, 0.029205322265625, 0.0399169921875, 0.050628662109375, 0.06134033203125, 0.072052001953125, 0.082763671875, 0.093475341796875, 0.10418701171875, 0.114898681640625, 0.1256103515625, 0.136322021484375, 0.14703369140625, 0.157745361328125, 0.16845703125, 0.179168701171875, 0.18988037109375, 0.200592041015625, 0.2113037109375, 0.222015380859375, 0.23272705078125, 0.243438720703125, 0.254150390625, 0.264862060546875, 0.27557373046875, 0.286285400390625, 0.2969970703125, 0.307708740234375, 0.31842041015625, 0.329132080078125, 0.33984375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 6.0, 1.0, 7.0, 11.0, 9.0, 24.0, 58.0, 123.0, 268.0, 271.0, 125.0, 48.0, 24.0, 11.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-9.626150131225586e-05, -9.396951645612717e-05, -9.167753159999847e-05, -8.938554674386978e-05, -8.709356188774109e-05, -8.48015770316124e-05, -8.25095921754837e-05, -8.021760731935501e-05, -7.792562246322632e-05, -7.563363760709763e-05, -7.334165275096893e-05, -7.104966789484024e-05, -6.875768303871155e-05, -6.646569818258286e-05, -6.417371332645416e-05, -6.188172847032547e-05, -5.958974361419678e-05, -5.7297758758068085e-05, -5.500577390193939e-05, -5.27137890458107e-05, -5.042180418968201e-05, -4.8129819333553314e-05, -4.583783447742462e-05, -4.354584962129593e-05, -4.1253864765167236e-05, -3.8961879909038544e-05, -3.666989505290985e-05, -3.437791019678116e-05, -3.2085925340652466e-05, -2.9793940484523773e-05, -2.750195562839508e-05, -2.5209970772266388e-05, -2.2917985916137695e-05, -2.0626001060009003e-05, -1.833401620388031e-05, -1.6042031347751617e-05, -1.3750046491622925e-05, -1.1458061635494232e-05, -9.16607677936554e-06, -6.874091923236847e-06, -4.582107067108154e-06, -2.2901222109794617e-06, 1.862645149230957e-09, 2.2938475012779236e-06, 4.585832357406616e-06, 6.877817213535309e-06, 9.169802069664001e-06, 1.1461786925792694e-05, 1.3753771781921387e-05, 1.604575663805008e-05, 1.8337741494178772e-05, 2.0629726350307465e-05, 2.2921711206436157e-05, 2.521369606256485e-05, 2.7505680918693542e-05, 2.9797665774822235e-05, 3.208965063095093e-05, 3.438163548707962e-05, 3.667362034320831e-05, 3.8965605199337006e-05, 4.12575900554657e-05, 4.354957491159439e-05, 4.5841559767723083e-05, 4.8133544623851776e-05, 5.042552947998047e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 5.0, 6.0, 4.0, 11.0, 13.0, 17.0, 15.0, 36.0, 59.0, 66.0, 144.0, 250.0, 449.0, 1091.0, 3020.0, 13443.0, 238869.0, 759405.0, 24863.0, 4269.0, 1346.0, 546.0, 246.0, 148.0, 81.0, 43.0, 47.0, 27.0, 6.0, 13.0, 10.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.52978515625, -0.5162506103515625, -0.502716064453125, -0.4891815185546875, -0.47564697265625, -0.4621124267578125, -0.448577880859375, -0.4350433349609375, -0.4215087890625, -0.4079742431640625, -0.394439697265625, -0.3809051513671875, -0.36737060546875, -0.3538360595703125, -0.340301513671875, -0.3267669677734375, -0.313232421875, -0.2996978759765625, -0.286163330078125, -0.2726287841796875, -0.25909423828125, -0.2455596923828125, -0.232025146484375, -0.2184906005859375, -0.2049560546875, -0.1914215087890625, -0.177886962890625, -0.1643524169921875, -0.15081787109375, -0.1372833251953125, -0.123748779296875, -0.1102142333984375, -0.0966796875, -0.0831451416015625, -0.069610595703125, -0.0560760498046875, -0.04254150390625, -0.0290069580078125, -0.015472412109375, -0.0019378662109375, 0.0115966796875, 0.0251312255859375, 0.038665771484375, 0.0522003173828125, 0.06573486328125, 0.0792694091796875, 0.092803955078125, 0.1063385009765625, 0.119873046875, 0.1334075927734375, 0.146942138671875, 0.1604766845703125, 0.17401123046875, 0.1875457763671875, 0.201080322265625, 0.2146148681640625, 0.2281494140625, 0.2416839599609375, 0.255218505859375, 0.2687530517578125, 0.28228759765625, 0.2958221435546875, 0.309356689453125, 0.3228912353515625, 0.33642578125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 14.0, 14.0, 15.0, 25.0, 40.0, 71.0, 93.0, 148.0, 193.0, 145.0, 84.0, 59.0, 33.0, 23.0, 19.0, 12.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2451171875, -0.23903656005859375, -0.2329559326171875, -0.22687530517578125, -0.220794677734375, -0.21471405029296875, -0.2086334228515625, -0.20255279541015625, -0.19647216796875, -0.19039154052734375, -0.1843109130859375, -0.17823028564453125, -0.172149658203125, -0.16606903076171875, -0.1599884033203125, -0.15390777587890625, -0.1478271484375, -0.14174652099609375, -0.1356658935546875, -0.12958526611328125, -0.123504638671875, -0.11742401123046875, -0.1113433837890625, -0.10526275634765625, -0.09918212890625, -0.09310150146484375, -0.0870208740234375, -0.08094024658203125, -0.074859619140625, -0.06877899169921875, -0.0626983642578125, -0.05661773681640625, -0.050537109375, -0.04445648193359375, -0.0383758544921875, -0.03229522705078125, -0.026214599609375, -0.02013397216796875, -0.0140533447265625, -0.00797271728515625, -0.00189208984375, 0.00418853759765625, 0.0102691650390625, 0.01634979248046875, 0.022430419921875, 0.02851104736328125, 0.0345916748046875, 0.04067230224609375, 0.0467529296875, 0.05283355712890625, 0.0589141845703125, 0.06499481201171875, 0.071075439453125, 0.07715606689453125, 0.0832366943359375, 0.08931732177734375, 0.09539794921875, 0.10147857666015625, 0.1075592041015625, 0.11363983154296875, 0.119720458984375, 0.12580108642578125, 0.1318817138671875, 0.13796234130859375, 0.14404296875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 13.0, 55.0, 376.0, 465.0, 74.0, 19.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2755889892578125, -4.111359119415283, -3.947129249572754, -3.7828996181488037, -3.6186697483062744, -3.454439878463745, -3.290210247039795, -3.1259803771972656, -2.9617505073547363, -2.797520637512207, -2.6332907676696777, -2.4690611362457275, -2.3048312664031982, -2.140601396560669, -1.9763716459274292, -1.8121418952941895, -1.6479120254516602, -1.4836821556091309, -1.3194524049758911, -1.1552226543426514, -0.9909927845001221, -0.8267629742622375, -0.662533164024353, -0.4983034133911133, -0.334073543548584, -0.16984373331069946, -0.005613923072814941, 0.15861588716506958, 0.3228456974029541, 0.4870755076408386, 0.6513053178787231, 0.8155350685119629, 0.9797649383544922, 1.1439948081970215, 1.3082245588302612, 1.472454309463501, 1.6366841793060303, 1.8009140491485596, 1.9651437997817993, 2.129373550415039, 2.2936034202575684, 2.4578332901000977, 2.622063159942627, 2.786292791366577, 2.9505226612091064, 3.1147525310516357, 3.278982162475586, 3.4432120323181152, 3.6074419021606445, 3.771671772003174, 3.935901641845703, 4.100131511688232, 4.264361381530762, 4.428590774536133, 4.592820644378662, 4.757050514221191, 4.921280384063721, 5.08551025390625, 5.249740123748779, 5.413969993591309, 5.57819938659668, 5.742429256439209, 5.906659126281738, 6.070888996124268, 6.235118865966797]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 8.0, 9.0, 13.0, 10.0, 18.0, 15.0, 20.0, 15.0, 29.0, 29.0, 39.0, 45.0, 37.0, 35.0, 55.0, 47.0, 52.0, 50.0, 49.0, 60.0, 41.0, 34.0, 44.0, 31.0, 31.0, 30.0, 25.0, 27.0, 20.0, 7.0, 14.0, 16.0, 6.0, 10.0, 3.0, 2.0, 5.0, 0.0, 5.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0], "bins": [-1.2468233108520508, -1.2118947505950928, -1.1769661903381348, -1.1420376300811768, -1.1071090698242188, -1.0721803903579712, -1.0372518301010132, -1.0023232698440552, -0.9673947095870972, -0.9324661493301392, -0.8975375890731812, -0.8626089692115784, -0.8276804089546204, -0.7927518486976624, -0.7578232288360596, -0.7228946685791016, -0.6879661083221436, -0.6530375480651855, -0.6181089878082275, -0.5831803679466248, -0.5482518076896667, -0.5133232474327087, -0.47839465737342834, -0.44346606731414795, -0.40853750705718994, -0.37360894680023193, -0.33868035674095154, -0.30375176668167114, -0.26882320642471313, -0.23389463126659393, -0.19896605610847473, -0.16403748095035553, -0.12910878658294678, -0.09418021142482758, -0.059251636266708374, -0.024323061108589172, 0.01060551404953003, 0.04553408920764923, 0.08046266436576843, 0.11539123952388763, 0.15031981468200684, 0.18524838984012604, 0.22017696499824524, 0.25510555505752563, 0.29003411531448364, 0.32496267557144165, 0.35989126563072205, 0.39481985569000244, 0.42974841594696045, 0.46467697620391846, 0.49960556626319885, 0.5345341563224792, 0.5694627165794373, 0.6043912768363953, 0.639319896697998, 0.674248456954956, 0.7091770172119141, 0.7441055774688721, 0.7790341377258301, 0.8139627575874329, 0.8488913178443909, 0.8838198781013489, 0.9187484979629517, 0.9536770582199097, 0.9886056184768677]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 4.0, 5.0, 10.0, 5.0, 8.0, 11.0, 16.0, 14.0, 25.0, 18.0, 23.0, 43.0, 67.0, 109.0, 256.0, 662.0, 2744.0, 21615.0, 4098914.0, 63524.0, 4939.0, 880.0, 230.0, 106.0, 26.0, 15.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.521484375, -2.4717178344726562, -2.4219512939453125, -2.3721847534179688, -2.322418212890625, -2.2726516723632812, -2.2228851318359375, -2.1731185913085938, -2.12335205078125, -2.0735855102539062, -2.0238189697265625, -1.9740524291992188, -1.924285888671875, -1.8745193481445312, -1.8247528076171875, -1.7749862670898438, -1.7252197265625, -1.6754531860351562, -1.6256866455078125, -1.5759201049804688, -1.526153564453125, -1.4763870239257812, -1.4266204833984375, -1.3768539428710938, -1.32708740234375, -1.2773208618164062, -1.2275543212890625, -1.1777877807617188, -1.128021240234375, -1.0782546997070312, -1.0284881591796875, -0.9787216186523438, -0.928955078125, -0.8791885375976562, -0.8294219970703125, -0.7796554565429688, -0.729888916015625, -0.6801223754882812, -0.6303558349609375, -0.5805892944335938, -0.53082275390625, -0.48105621337890625, -0.4312896728515625, -0.38152313232421875, -0.331756591796875, -0.28199005126953125, -0.2322235107421875, -0.18245697021484375, -0.1326904296875, -0.08292388916015625, -0.0331573486328125, 0.01660919189453125, 0.066375732421875, 0.11614227294921875, 0.1659088134765625, 0.21567535400390625, 0.26544189453125, 0.31520843505859375, 0.3649749755859375, 0.41474151611328125, 0.464508056640625, 0.5142745971679688, 0.5640411376953125, 0.6138076782226562, 0.66357421875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 9.0, 11.0, 22.0, 57.0, 93.0, 142.0, 167.0, 161.0, 141.0, 79.0, 72.0, 22.0, 17.0, 12.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.1815185546875, -0.17808818817138672, -0.17465782165527344, -0.17122745513916016, -0.16779708862304688, -0.1643667221069336, -0.1609363555908203, -0.15750598907470703, -0.15407562255859375, -0.15064525604248047, -0.1472148895263672, -0.1437845230102539, -0.14035415649414062, -0.13692378997802734, -0.13349342346191406, -0.13006305694580078, -0.1266326904296875, -0.12320232391357422, -0.11977195739746094, -0.11634159088134766, -0.11291122436523438, -0.1094808578491211, -0.10605049133300781, -0.10262012481689453, -0.09918975830078125, -0.09575939178466797, -0.09232902526855469, -0.0888986587524414, -0.08546829223632812, -0.08203792572021484, -0.07860755920410156, -0.07517719268798828, -0.071746826171875, -0.06831645965576172, -0.06488609313964844, -0.061455726623535156, -0.058025360107421875, -0.054594993591308594, -0.05116462707519531, -0.04773426055908203, -0.04430389404296875, -0.04087352752685547, -0.03744316101074219, -0.034012794494628906, -0.030582427978515625, -0.027152061462402344, -0.023721694946289062, -0.02029132843017578, -0.0168609619140625, -0.013430595397949219, -0.010000228881835938, -0.006569862365722656, -0.003139495849609375, 0.00029087066650390625, 0.0037212371826171875, 0.007151603698730469, 0.01058197021484375, 0.014012336730957031, 0.017442703247070312, 0.020873069763183594, 0.024303436279296875, 0.027733802795410156, 0.031164169311523438, 0.03459453582763672, 0.03802490234375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 6.0, 9.0, 12.0, 14.0, 20.0, 31.0, 46.0, 50.0, 89.0, 133.0, 266.0, 649.0, 2394.0, 462560.0, 3724342.0, 2525.0, 602.0, 229.0, 120.0, 70.0, 33.0, 25.0, 21.0, 19.0, 11.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.76953125, -4.66119384765625, -4.5528564453125, -4.44451904296875, -4.336181640625, -4.22784423828125, -4.1195068359375, -4.01116943359375, -3.90283203125, -3.79449462890625, -3.6861572265625, -3.57781982421875, -3.469482421875, -3.36114501953125, -3.2528076171875, -3.14447021484375, -3.0361328125, -2.92779541015625, -2.8194580078125, -2.71112060546875, -2.602783203125, -2.49444580078125, -2.3861083984375, -2.27777099609375, -2.16943359375, -2.06109619140625, -1.9527587890625, -1.84442138671875, -1.736083984375, -1.62774658203125, -1.5194091796875, -1.41107177734375, -1.302734375, -1.19439697265625, -1.0860595703125, -0.97772216796875, -0.869384765625, -0.76104736328125, -0.6527099609375, -0.54437255859375, -0.43603515625, -0.32769775390625, -0.2193603515625, -0.11102294921875, -0.002685546875, 0.10565185546875, 0.2139892578125, 0.32232666015625, 0.4306640625, 0.53900146484375, 0.6473388671875, 0.75567626953125, 0.864013671875, 0.97235107421875, 1.0806884765625, 1.18902587890625, 1.29736328125, 1.40570068359375, 1.5140380859375, 1.62237548828125, 1.730712890625, 1.83905029296875, 1.9473876953125, 2.05572509765625, 2.1640625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 11.0, 27.0, 76.0, 500.0, 3239.0, 138.0, 47.0, 22.0, 11.0, 6.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.68408203125, -0.6707286834716797, -0.6573753356933594, -0.6440219879150391, -0.6306686401367188, -0.6173152923583984, -0.6039619445800781, -0.5906085968017578, -0.5772552490234375, -0.5639019012451172, -0.5505485534667969, -0.5371952056884766, -0.5238418579101562, -0.5104885101318359, -0.4971351623535156, -0.4837818145751953, -0.470428466796875, -0.4570751190185547, -0.4437217712402344, -0.43036842346191406, -0.41701507568359375, -0.40366172790527344, -0.3903083801269531, -0.3769550323486328, -0.3636016845703125, -0.3502483367919922, -0.3368949890136719, -0.32354164123535156, -0.31018829345703125, -0.29683494567871094, -0.2834815979003906, -0.2701282501220703, -0.25677490234375, -0.2434215545654297, -0.23006820678710938, -0.21671485900878906, -0.20336151123046875, -0.19000816345214844, -0.17665481567382812, -0.1633014678955078, -0.1499481201171875, -0.1365947723388672, -0.12324142456054688, -0.10988807678222656, -0.09653472900390625, -0.08318138122558594, -0.06982803344726562, -0.05647468566894531, -0.043121337890625, -0.029767990112304688, -0.016414642333984375, -0.0030612945556640625, 0.01029205322265625, 0.023645401000976562, 0.036998748779296875, 0.05035209655761719, 0.0637054443359375, 0.07705879211425781, 0.09041213989257812, 0.10376548767089844, 0.11711883544921875, 0.13047218322753906, 0.14382553100585938, 0.1571788787841797, 0.1705322265625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 6.0, 13.0, 26.0, 38.0, 98.0, 254.0, 330.0, 146.0, 60.0, 26.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2138893604278564, -2.154564380645752, -2.0952396392822266, -2.035914659500122, -1.9765897989273071, -1.9172649383544922, -1.8579399585723877, -1.7986150979995728, -1.7392902374267578, -1.6799653768539429, -1.6206403970718384, -1.5613155364990234, -1.5019906759262085, -1.4426658153533936, -1.383340835571289, -1.3240159749984741, -1.2646911144256592, -1.2053662538528442, -1.1460412740707397, -1.0867164134979248, -1.0273915529251099, -0.9680666327476501, -0.9087417125701904, -0.8494168519973755, -0.790091872215271, -0.7307669520378113, -0.6714420914649963, -0.6121171712875366, -0.5527923107147217, -0.49346739053726196, -0.43414250016212463, -0.3748176097869873, -0.31549274921417236, -0.25616785883903503, -0.1968429684638977, -0.13751806318759918, -0.07819317281246185, -0.01886826753616333, 0.040456622838974, 0.09978151321411133, 0.15910640358924866, 0.218431293964386, 0.2777561843395233, 0.33708107471466064, 0.39640599489212036, 0.4557308852672577, 0.515055775642395, 0.57438063621521, 0.6337055563926697, 0.6930304765701294, 0.7523553371429443, 0.811680257320404, 0.871005117893219, 0.9303300380706787, 0.9896548986434937, 1.0489797592163086, 1.108304738998413, 1.167629599571228, 1.2269545793533325, 1.2862794399261475, 1.3456043004989624, 1.4049291610717773, 1.4642541408538818, 1.5235790014266968, 1.5829038619995117]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 4.0, 14.0, 11.0, 23.0, 41.0, 44.0, 71.0, 80.0, 88.0, 98.0, 104.0, 116.0, 88.0, 72.0, 50.0, 36.0, 24.0, 17.0, 17.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7556730508804321, -0.7271475195884705, -0.6986219882965088, -0.6700963973999023, -0.6415708661079407, -0.613045334815979, -0.5845198035240173, -0.5559942722320557, -0.527468740940094, -0.4989432096481323, -0.47041764855384827, -0.4418921172618866, -0.4133665859699249, -0.38484102487564087, -0.3563154935836792, -0.32778996229171753, -0.29926440119743347, -0.2707388699054718, -0.24221332371234894, -0.21368777751922607, -0.1851622462272644, -0.15663670003414154, -0.12811115384101868, -0.099585622549057, -0.07106007635593414, -0.042534537613391876, -0.014008995145559311, 0.014516547322273254, 0.04304208606481552, 0.07156762480735779, 0.10009317100048065, 0.12861870229244232, 0.15714424848556519, 0.18566979467868805, 0.21419532597064972, 0.24272087216377258, 0.27124640345573425, 0.2997719645500183, 0.32829749584198, 0.35682302713394165, 0.3853485584259033, 0.413874089717865, 0.44239965081214905, 0.4709251821041107, 0.4994507133960724, 0.5279762744903564, 0.5565018057823181, 0.5850273370742798, 0.6135529279708862, 0.6420784592628479, 0.6706039905548096, 0.699129581451416, 0.7276551127433777, 0.7561806440353394, 0.784706175327301, 0.8132317066192627, 0.8417572379112244, 0.870282769203186, 0.8988083004951477, 0.9273338317871094, 0.9558594226837158, 0.9843849539756775, 1.0129104852676392, 1.041435956954956, 1.0699615478515625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 2.0, 5.0, 14.0, 9.0, 4.0, 18.0, 23.0, 17.0, 39.0, 48.0, 61.0, 69.0, 123.0, 153.0, 247.0, 376.0, 585.0, 995.0, 2191.0, 5598.0, 17749.0, 69616.0, 385230.0, 450936.0, 82390.0, 20310.0, 6329.0, 2421.0, 1107.0, 591.0, 379.0, 255.0, 171.0, 135.0, 95.0, 57.0, 45.0, 41.0, 33.0, 21.0, 20.0, 17.0, 14.0, 5.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.390869140625, -0.3797187805175781, -0.36856842041015625, -0.3574180603027344, -0.3462677001953125, -0.3351173400878906, -0.32396697998046875, -0.3128166198730469, -0.301666259765625, -0.2905158996582031, -0.27936553955078125, -0.2682151794433594, -0.2570648193359375, -0.24591445922851562, -0.23476409912109375, -0.22361373901367188, -0.21246337890625, -0.20131301879882812, -0.19016265869140625, -0.17901229858398438, -0.1678619384765625, -0.15671157836914062, -0.14556121826171875, -0.13441085815429688, -0.123260498046875, -0.11211013793945312, -0.10095977783203125, -0.08980941772460938, -0.0786590576171875, -0.06750869750976562, -0.05635833740234375, -0.045207977294921875, -0.0340576171875, -0.022907257080078125, -0.01175689697265625, -0.000606536865234375, 0.0105438232421875, 0.021694183349609375, 0.03284454345703125, 0.043994903564453125, 0.055145263671875, 0.06629562377929688, 0.07744598388671875, 0.08859634399414062, 0.0997467041015625, 0.11089706420898438, 0.12204742431640625, 0.13319778442382812, 0.14434814453125, 0.15549850463867188, 0.16664886474609375, 0.17779922485351562, 0.1889495849609375, 0.20009994506835938, 0.21125030517578125, 0.22240066528320312, 0.233551025390625, 0.24470138549804688, 0.25585174560546875, 0.2670021057128906, 0.2781524658203125, 0.2893028259277344, 0.30045318603515625, 0.3116035461425781, 0.32275390625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 4.0, 3.0, 8.0, 17.0, 18.0, 30.0, 49.0, 55.0, 74.0, 98.0, 99.0, 87.0, 110.0, 75.0, 86.0, 60.0, 41.0, 32.0, 20.0, 11.0, 10.0, 4.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.096435546875, -0.09410381317138672, -0.09177207946777344, -0.08944034576416016, -0.08710861206054688, -0.0847768783569336, -0.08244514465332031, -0.08011341094970703, -0.07778167724609375, -0.07544994354248047, -0.07311820983886719, -0.0707864761352539, -0.06845474243164062, -0.06612300872802734, -0.06379127502441406, -0.06145954132080078, -0.0591278076171875, -0.05679607391357422, -0.05446434020996094, -0.052132606506347656, -0.049800872802734375, -0.047469139099121094, -0.04513740539550781, -0.04280567169189453, -0.04047393798828125, -0.03814220428466797, -0.03581047058105469, -0.033478736877441406, -0.031147003173828125, -0.028815269470214844, -0.026483535766601562, -0.02415180206298828, -0.021820068359375, -0.01948833465576172, -0.017156600952148438, -0.014824867248535156, -0.012493133544921875, -0.010161399841308594, -0.007829666137695312, -0.005497932434082031, -0.00316619873046875, -0.0008344650268554688, 0.0014972686767578125, 0.0038290023803710938, 0.006160736083984375, 0.008492469787597656, 0.010824203491210938, 0.013155937194824219, 0.0154876708984375, 0.01781940460205078, 0.020151138305664062, 0.022482872009277344, 0.024814605712890625, 0.027146339416503906, 0.029478073120117188, 0.03180980682373047, 0.03414154052734375, 0.03647327423095703, 0.03880500793457031, 0.041136741638183594, 0.043468475341796875, 0.045800209045410156, 0.04813194274902344, 0.05046367645263672, 0.05279541015625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 4.0, 4.0, 8.0, 14.0, 19.0, 30.0, 40.0, 54.0, 84.0, 153.0, 192.0, 333.0, 637.0, 1292.0, 3258.0, 10280.0, 42855.0, 252636.0, 586927.0, 116417.0, 22942.0, 6107.0, 2142.0, 943.0, 427.0, 261.0, 152.0, 93.0, 66.0, 43.0, 34.0, 29.0, 19.0, 14.0, 16.0, 3.0, 13.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.29248046875, -0.2828254699707031, -0.27317047119140625, -0.2635154724121094, -0.2538604736328125, -0.24420547485351562, -0.23455047607421875, -0.22489547729492188, -0.215240478515625, -0.20558547973632812, -0.19593048095703125, -0.18627548217773438, -0.1766204833984375, -0.16696548461914062, -0.15731048583984375, -0.14765548706054688, -0.13800048828125, -0.12834548950195312, -0.11869049072265625, -0.10903549194335938, -0.0993804931640625, -0.08972549438476562, -0.08007049560546875, -0.07041549682617188, -0.060760498046875, -0.051105499267578125, -0.04145050048828125, -0.031795501708984375, -0.0221405029296875, -0.012485504150390625, -0.00283050537109375, 0.006824493408203125, 0.0164794921875, 0.026134490966796875, 0.03578948974609375, 0.045444488525390625, 0.0550994873046875, 0.06475448608398438, 0.07440948486328125, 0.08406448364257812, 0.093719482421875, 0.10337448120117188, 0.11302947998046875, 0.12268447875976562, 0.1323394775390625, 0.14199447631835938, 0.15164947509765625, 0.16130447387695312, 0.17095947265625, 0.18061447143554688, 0.19026947021484375, 0.19992446899414062, 0.2095794677734375, 0.21923446655273438, 0.22888946533203125, 0.23854446411132812, 0.248199462890625, 0.2578544616699219, 0.26750946044921875, 0.2771644592285156, 0.2868194580078125, 0.2964744567871094, 0.30612945556640625, 0.3157844543457031, 0.325439453125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 3.0, 6.0, 5.0, 10.0, 7.0, 7.0, 18.0, 22.0, 28.0, 29.0, 26.0, 29.0, 30.0, 37.0, 34.0, 38.0, 50.0, 46.0, 50.0, 57.0, 46.0, 52.0, 46.0, 45.0, 40.0, 38.0, 37.0, 31.0, 25.0, 15.0, 14.0, 17.0, 16.0, 9.0, 10.0, 4.0, 12.0, 6.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1680908203125, -0.16225051879882812, -0.15641021728515625, -0.15056991577148438, -0.1447296142578125, -0.13888931274414062, -0.13304901123046875, -0.12720870971679688, -0.121368408203125, -0.11552810668945312, -0.10968780517578125, -0.10384750366210938, -0.0980072021484375, -0.09216690063476562, -0.08632659912109375, -0.08048629760742188, -0.07464599609375, -0.06880569458007812, -0.06296539306640625, -0.057125091552734375, -0.0512847900390625, -0.045444488525390625, -0.03960418701171875, -0.033763885498046875, -0.027923583984375, -0.022083282470703125, -0.01624298095703125, -0.010402679443359375, -0.0045623779296875, 0.001277923583984375, 0.00711822509765625, 0.012958526611328125, 0.018798828125, 0.024639129638671875, 0.03047943115234375, 0.036319732666015625, 0.0421600341796875, 0.048000335693359375, 0.05384063720703125, 0.059680938720703125, 0.065521240234375, 0.07136154174804688, 0.07720184326171875, 0.08304214477539062, 0.0888824462890625, 0.09472274780273438, 0.10056304931640625, 0.10640335083007812, 0.11224365234375, 0.11808395385742188, 0.12392425537109375, 0.12976455688476562, 0.1356048583984375, 0.14144515991210938, 0.14728546142578125, 0.15312576293945312, 0.158966064453125, 0.16480636596679688, 0.17064666748046875, 0.17648696899414062, 0.1823272705078125, 0.18816757202148438, 0.19400787353515625, 0.19984817504882812, 0.2056884765625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 7.0, 10.0, 7.0, 14.0, 24.0, 43.0, 70.0, 162.0, 335.0, 973.0, 3426.0, 17032.0, 249448.0, 730329.0, 38501.0, 5786.0, 1435.0, 502.0, 213.0, 95.0, 57.0, 39.0, 19.0, 9.0, 9.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1619873046875, -0.1552906036376953, -0.14859390258789062, -0.14189720153808594, -0.13520050048828125, -0.12850379943847656, -0.12180709838867188, -0.11511039733886719, -0.1084136962890625, -0.10171699523925781, -0.09502029418945312, -0.08832359313964844, -0.08162689208984375, -0.07493019104003906, -0.06823348999023438, -0.06153678894042969, -0.054840087890625, -0.04814338684082031, -0.041446685791015625, -0.03474998474121094, -0.02805328369140625, -0.021356582641601562, -0.014659881591796875, -0.007963180541992188, -0.0012664794921875, 0.0054302215576171875, 0.012126922607421875, 0.018823623657226562, 0.02552032470703125, 0.03221702575683594, 0.038913726806640625, 0.04561042785644531, 0.05230712890625, 0.05900382995605469, 0.06570053100585938, 0.07239723205566406, 0.07909393310546875, 0.08579063415527344, 0.09248733520507812, 0.09918403625488281, 0.1058807373046875, 0.11257743835449219, 0.11927413940429688, 0.12597084045410156, 0.13266754150390625, 0.13936424255371094, 0.14606094360351562, 0.1527576446533203, 0.159454345703125, 0.1661510467529297, 0.17284774780273438, 0.17954444885253906, 0.18624114990234375, 0.19293785095214844, 0.19963455200195312, 0.2063312530517578, 0.2130279541015625, 0.2197246551513672, 0.22642135620117188, 0.23311805725097656, 0.23981475830078125, 0.24651145935058594, 0.2532081604003906, 0.2599048614501953, 0.2666015625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 1.0, 7.0, 6.0, 3.0, 5.0, 14.0, 21.0, 15.0, 43.0, 42.0, 67.0, 65.0, 87.0, 117.0, 106.0, 80.0, 81.0, 64.0, 36.0, 34.0, 20.0, 17.0, 14.0, 9.0, 5.0, 7.0, 6.0, 3.0, 5.0, 5.0, 0.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8656253814697266e-05, -1.8013641238212585e-05, -1.7371028661727905e-05, -1.6728416085243225e-05, -1.6085803508758545e-05, -1.5443190932273865e-05, -1.4800578355789185e-05, -1.4157965779304504e-05, -1.3515353202819824e-05, -1.2872740626335144e-05, -1.2230128049850464e-05, -1.1587515473365784e-05, -1.0944902896881104e-05, -1.0302290320396423e-05, -9.659677743911743e-06, -9.017065167427063e-06, -8.374452590942383e-06, -7.731840014457703e-06, -7.0892274379730225e-06, -6.446614861488342e-06, -5.804002285003662e-06, -5.161389708518982e-06, -4.518777132034302e-06, -3.876164555549622e-06, -3.2335519790649414e-06, -2.5909394025802612e-06, -1.948326826095581e-06, -1.3057142496109009e-06, -6.631016731262207e-07, -2.0489096641540527e-08, 6.221234798431396e-07, 1.2647360563278198e-06, 1.9073486328125e-06, 2.54996120929718e-06, 3.1925737857818604e-06, 3.8351863622665405e-06, 4.477798938751221e-06, 5.120411515235901e-06, 5.763024091720581e-06, 6.405636668205261e-06, 7.048249244689941e-06, 7.690861821174622e-06, 8.333474397659302e-06, 8.976086974143982e-06, 9.618699550628662e-06, 1.0261312127113342e-05, 1.0903924703598022e-05, 1.1546537280082703e-05, 1.2189149856567383e-05, 1.2831762433052063e-05, 1.3474375009536743e-05, 1.4116987586021423e-05, 1.4759600162506104e-05, 1.5402212738990784e-05, 1.6044825315475464e-05, 1.6687437891960144e-05, 1.7330050468444824e-05, 1.7972663044929504e-05, 1.8615275621414185e-05, 1.9257888197898865e-05, 1.9900500774383545e-05, 2.0543113350868225e-05, 2.1185725927352905e-05, 2.1828338503837585e-05, 2.2470951080322266e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 5.0, 12.0, 14.0, 24.0, 49.0, 66.0, 80.0, 205.0, 457.0, 1191.0, 3963.0, 17771.0, 137731.0, 777399.0, 91097.0, 13488.0, 3244.0, 981.0, 378.0, 158.0, 87.0, 52.0, 30.0, 31.0, 9.0, 4.0, 7.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1488037109375, -0.14270973205566406, -0.13661575317382812, -0.1305217742919922, -0.12442779541015625, -0.11833381652832031, -0.11223983764648438, -0.10614585876464844, -0.1000518798828125, -0.09395790100097656, -0.08786392211914062, -0.08176994323730469, -0.07567596435546875, -0.06958198547363281, -0.06348800659179688, -0.05739402770996094, -0.051300048828125, -0.04520606994628906, -0.039112091064453125, -0.03301811218261719, -0.02692413330078125, -0.020830154418945312, -0.014736175537109375, -0.008642196655273438, -0.0025482177734375, 0.0035457611083984375, 0.009639739990234375, 0.015733718872070312, 0.02182769775390625, 0.027921676635742188, 0.034015655517578125, 0.04010963439941406, 0.04620361328125, 0.05229759216308594, 0.058391571044921875, 0.06448554992675781, 0.07057952880859375, 0.07667350769042969, 0.08276748657226562, 0.08886146545410156, 0.0949554443359375, 0.10104942321777344, 0.10714340209960938, 0.11323738098144531, 0.11933135986328125, 0.1254253387451172, 0.13151931762695312, 0.13761329650878906, 0.143707275390625, 0.14980125427246094, 0.15589523315429688, 0.1619892120361328, 0.16808319091796875, 0.1741771697998047, 0.18027114868164062, 0.18636512756347656, 0.1924591064453125, 0.19855308532714844, 0.20464706420898438, 0.2107410430908203, 0.21683502197265625, 0.2229290008544922, 0.22902297973632812, 0.23511695861816406, 0.2412109375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 5.0, 3.0, 3.0, 8.0, 8.0, 5.0, 13.0, 16.0, 23.0, 36.0, 37.0, 43.0, 83.0, 86.0, 104.0, 112.0, 105.0, 84.0, 69.0, 38.0, 28.0, 21.0, 15.0, 17.0, 13.0, 8.0, 6.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08416748046875, -0.08108043670654297, -0.07799339294433594, -0.0749063491821289, -0.07181930541992188, -0.06873226165771484, -0.06564521789550781, -0.06255817413330078, -0.05947113037109375, -0.05638408660888672, -0.05329704284667969, -0.050209999084472656, -0.047122955322265625, -0.044035911560058594, -0.04094886779785156, -0.03786182403564453, -0.0347747802734375, -0.03168773651123047, -0.028600692749023438, -0.025513648986816406, -0.022426605224609375, -0.019339561462402344, -0.016252517700195312, -0.013165473937988281, -0.01007843017578125, -0.006991386413574219, -0.0039043426513671875, -0.0008172988891601562, 0.002269744873046875, 0.005356788635253906, 0.008443832397460938, 0.011530876159667969, 0.014617919921875, 0.01770496368408203, 0.020792007446289062, 0.023879051208496094, 0.026966094970703125, 0.030053138732910156, 0.03314018249511719, 0.03622722625732422, 0.03931427001953125, 0.04240131378173828, 0.04548835754394531, 0.048575401306152344, 0.051662445068359375, 0.054749488830566406, 0.05783653259277344, 0.06092357635498047, 0.0640106201171875, 0.06709766387939453, 0.07018470764160156, 0.0732717514038086, 0.07635879516601562, 0.07944583892822266, 0.08253288269042969, 0.08561992645263672, 0.08870697021484375, 0.09179401397705078, 0.09488105773925781, 0.09796810150146484, 0.10105514526367188, 0.1041421890258789, 0.10722923278808594, 0.11031627655029297, 0.1134033203125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [4.0, 1.0, 6.0, 16.0, 79.0, 380.0, 406.0, 101.0, 14.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9617555737495422, -0.8040404319763184, -0.6463253498077393, -0.48861023783683777, -0.3308951258659363, -0.17318004369735718, -0.0154649019241333, 0.14225023984909058, 0.2999653220176697, 0.45768043398857117, 0.6153955459594727, 0.7731106281280518, 0.9308257699012756, 1.08854079246521, 1.2462559938430786, 1.4039711952209473, 1.5616862773895264, 1.7194013595581055, 1.8771164417266846, 2.0348315238952637, 2.192546844482422, 2.350261688232422, 2.50797700881958, 2.665692090988159, 2.8234071731567383, 2.9811222553253174, 3.1388373374938965, 3.2965524196624756, 3.4542675018310547, 3.611982822418213, 3.769697904586792, 3.927412986755371, 4.085127830505371, 4.242843151092529, 4.400557994842529, 4.5582733154296875, 4.7159881591796875, 4.873703479766846, 5.031418323516846, 5.189133644104004, 5.346848487854004, 5.504563808441162, 5.662278652191162, 5.81999397277832, 5.97770881652832, 6.1354241371154785, 6.2931389808654785, 6.450854301452637, 6.608569622039795, 6.766284942626953, 6.923999786376953, 7.081715106964111, 7.239429950714111, 7.3971452713012695, 7.5548601150512695, 7.712575435638428, 7.870290756225586, 8.028005599975586, 8.185721397399902, 8.343436241149902, 8.501151084899902, 8.658865928649902, 8.816581726074219, 8.974296569824219, 9.132011413574219]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 5.0, 0.0, 6.0, 9.0, 7.0, 9.0, 10.0, 12.0, 18.0, 19.0, 30.0, 29.0, 34.0, 43.0, 53.0, 54.0, 56.0, 65.0, 45.0, 52.0, 42.0, 64.0, 40.0, 37.0, 39.0, 42.0, 28.0, 29.0, 24.0, 23.0, 12.0, 19.0, 9.0, 12.0, 10.0, 5.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9964937567710876, -0.9590956568717957, -0.9216975569725037, -0.8842994570732117, -0.8469013571739197, -0.8095032572746277, -0.7721052169799805, -0.7347071170806885, -0.6973090171813965, -0.6599109172821045, -0.6225128173828125, -0.5851147174835205, -0.5477166175842285, -0.5103185176849365, -0.4729204475879669, -0.4355223476886749, -0.39812421798706055, -0.36072611808776855, -0.32332801818847656, -0.28592991828918457, -0.24853183329105377, -0.21113373339176178, -0.17373564839363098, -0.136337548494339, -0.098939448595047, -0.0615413524210453, -0.02414325624704361, 0.013254836201667786, 0.05065293610095978, 0.08805103600025177, 0.12544912099838257, 0.16284722089767456, 0.20024526119232178, 0.23764336109161377, 0.27504146099090576, 0.31243956089019775, 0.34983766078948975, 0.38723576068878174, 0.42463383078575134, 0.46203193068504333, 0.4994300305843353, 0.5368281006813049, 0.5742262005805969, 0.6116243004798889, 0.6490224003791809, 0.6864205002784729, 0.7238186001777649, 0.7612167000770569, 0.7986147999763489, 0.8360128998756409, 0.8734109997749329, 0.9108090996742249, 0.9482071995735168, 0.9856052994728088, 1.023003339767456, 1.060401439666748, 1.09779953956604, 1.135197639465332, 1.172595739364624, 1.209993839263916, 1.247391939163208, 1.2847900390625, 1.322188138961792, 1.359586238861084, 1.396984338760376]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 6.0, 6.0, 2.0, 5.0, 10.0, 13.0, 15.0, 29.0, 36.0, 33.0, 53.0, 86.0, 153.0, 227.0, 411.0, 853.0, 1979.0, 5907.0, 34367.0, 4058308.0, 78138.0, 8928.0, 2673.0, 1036.0, 456.0, 238.0, 119.0, 71.0, 42.0, 30.0, 14.0, 13.0, 8.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.97021484375, -0.9429855346679688, -0.9157562255859375, -0.8885269165039062, -0.861297607421875, -0.8340682983398438, -0.8068389892578125, -0.7796096801757812, -0.75238037109375, -0.7251510620117188, -0.6979217529296875, -0.6706924438476562, -0.643463134765625, -0.6162338256835938, -0.5890045166015625, -0.5617752075195312, -0.5345458984375, -0.5073165893554688, -0.4800872802734375, -0.45285797119140625, -0.425628662109375, -0.39839935302734375, -0.3711700439453125, -0.34394073486328125, -0.31671142578125, -0.28948211669921875, -0.2622528076171875, -0.23502349853515625, -0.207794189453125, -0.18056488037109375, -0.1533355712890625, -0.12610626220703125, -0.098876953125, -0.07164764404296875, -0.0444183349609375, -0.01718902587890625, 0.010040283203125, 0.03726959228515625, 0.0644989013671875, 0.09172821044921875, 0.11895751953125, 0.14618682861328125, 0.1734161376953125, 0.20064544677734375, 0.227874755859375, 0.25510406494140625, 0.2823333740234375, 0.30956268310546875, 0.3367919921875, 0.36402130126953125, 0.3912506103515625, 0.41847991943359375, 0.445709228515625, 0.47293853759765625, 0.5001678466796875, 0.5273971557617188, 0.55462646484375, 0.5818557739257812, 0.6090850830078125, 0.6363143920898438, 0.663543701171875, 0.6907730102539062, 0.7180023193359375, 0.7452316284179688, 0.7724609375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 14.0, 18.0, 27.0, 46.0, 63.0, 69.0, 78.0, 80.0, 116.0, 92.0, 89.0, 75.0, 60.0, 47.0, 42.0, 25.0, 16.0, 9.0, 11.0, 10.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0919189453125, -0.0896615982055664, -0.08740425109863281, -0.08514690399169922, -0.08288955688476562, -0.08063220977783203, -0.07837486267089844, -0.07611751556396484, -0.07386016845703125, -0.07160282135009766, -0.06934547424316406, -0.06708812713623047, -0.06483078002929688, -0.06257343292236328, -0.06031608581542969, -0.058058738708496094, -0.0558013916015625, -0.053544044494628906, -0.05128669738769531, -0.04902935028076172, -0.046772003173828125, -0.04451465606689453, -0.04225730895996094, -0.039999961853027344, -0.03774261474609375, -0.035485267639160156, -0.03322792053222656, -0.03097057342529297, -0.028713226318359375, -0.02645587921142578, -0.024198532104492188, -0.021941184997558594, -0.019683837890625, -0.017426490783691406, -0.015169143676757812, -0.012911796569824219, -0.010654449462890625, -0.008397102355957031, -0.0061397552490234375, -0.0038824081420898438, -0.00162506103515625, 0.0006322860717773438, 0.0028896331787109375, 0.005146980285644531, 0.007404327392578125, 0.009661674499511719, 0.011919021606445312, 0.014176368713378906, 0.0164337158203125, 0.018691062927246094, 0.020948410034179688, 0.02320575714111328, 0.025463104248046875, 0.02772045135498047, 0.029977798461914062, 0.032235145568847656, 0.03449249267578125, 0.036749839782714844, 0.03900718688964844, 0.04126453399658203, 0.043521881103515625, 0.04577922821044922, 0.04803657531738281, 0.050293922424316406, 0.05255126953125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 10.0, 19.0, 28.0, 40.0, 76.0, 113.0, 169.0, 357.0, 819.0, 3626.0, 44571.0, 4123874.0, 17114.0, 2144.0, 613.0, 263.0, 167.0, 105.0, 70.0, 38.0, 27.0, 15.0, 10.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5888671875, -1.5426177978515625, -1.496368408203125, -1.4501190185546875, -1.40386962890625, -1.3576202392578125, -1.311370849609375, -1.2651214599609375, -1.2188720703125, -1.1726226806640625, -1.126373291015625, -1.0801239013671875, -1.03387451171875, -0.9876251220703125, -0.941375732421875, -0.8951263427734375, -0.848876953125, -0.8026275634765625, -0.756378173828125, -0.7101287841796875, -0.66387939453125, -0.6176300048828125, -0.571380615234375, -0.5251312255859375, -0.4788818359375, -0.4326324462890625, -0.386383056640625, -0.3401336669921875, -0.29388427734375, -0.2476348876953125, -0.201385498046875, -0.1551361083984375, -0.10888671875, -0.0626373291015625, -0.016387939453125, 0.0298614501953125, 0.07611083984375, 0.1223602294921875, 0.168609619140625, 0.2148590087890625, 0.2611083984375, 0.3073577880859375, 0.353607177734375, 0.3998565673828125, 0.44610595703125, 0.4923553466796875, 0.538604736328125, 0.5848541259765625, 0.631103515625, 0.6773529052734375, 0.723602294921875, 0.7698516845703125, 0.81610107421875, 0.8623504638671875, 0.908599853515625, 0.9548492431640625, 1.0010986328125, 1.0473480224609375, 1.093597412109375, 1.1398468017578125, 1.18609619140625, 1.2323455810546875, 1.278594970703125, 1.3248443603515625, 1.37109375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 10.0, 17.0, 31.0, 49.0, 168.0, 2797.0, 831.0, 82.0, 43.0, 19.0, 10.0, 6.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28955078125, -0.28168487548828125, -0.2738189697265625, -0.26595306396484375, -0.258087158203125, -0.25022125244140625, -0.2423553466796875, -0.23448944091796875, -0.22662353515625, -0.21875762939453125, -0.2108917236328125, -0.20302581787109375, -0.195159912109375, -0.18729400634765625, -0.1794281005859375, -0.17156219482421875, -0.1636962890625, -0.15583038330078125, -0.1479644775390625, -0.14009857177734375, -0.132232666015625, -0.12436676025390625, -0.1165008544921875, -0.10863494873046875, -0.10076904296875, -0.09290313720703125, -0.0850372314453125, -0.07717132568359375, -0.069305419921875, -0.06143951416015625, -0.0535736083984375, -0.04570770263671875, -0.037841796875, -0.02997589111328125, -0.0221099853515625, -0.01424407958984375, -0.006378173828125, 0.00148773193359375, 0.0093536376953125, 0.01721954345703125, 0.02508544921875, 0.03295135498046875, 0.0408172607421875, 0.04868316650390625, 0.056549072265625, 0.06441497802734375, 0.0722808837890625, 0.08014678955078125, 0.0880126953125, 0.09587860107421875, 0.1037445068359375, 0.11161041259765625, 0.119476318359375, 0.12734222412109375, 0.1352081298828125, 0.14307403564453125, 0.15093994140625, 0.15880584716796875, 0.1666717529296875, 0.17453765869140625, 0.182403564453125, 0.19026947021484375, 0.1981353759765625, 0.20600128173828125, 0.2138671875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 42.0, 395.0, 537.0, 29.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.736001491546631, -4.611664295196533, -4.487326622009277, -4.36298942565918, -4.238652229309082, -4.114314556121826, -3.9899773597717285, -3.8656399250030518, -3.741302490234375, -3.6169650554656982, -3.4926276206970215, -3.368290424346924, -3.243952989578247, -3.1196155548095703, -2.9952783584594727, -2.870940923690796, -2.746603488922119, -2.6222660541534424, -2.4979286193847656, -2.373591423034668, -2.249253988265991, -2.1249165534973145, -2.000579357147217, -1.87624192237854, -1.7519044876098633, -1.6275670528411865, -1.5032297372817993, -1.378892421722412, -1.2545549869537354, -1.1302175521850586, -1.0058802366256714, -0.8815428614616394, -0.7572054862976074, -0.6328681111335754, -0.5085307359695435, -0.3841933608055115, -0.2598559856414795, -0.1355186104774475, -0.011181235313415527, 0.11315613985061646, 0.23749351501464844, 0.3618308901786804, 0.4861682653427124, 0.6105056405067444, 0.7348430156707764, 0.8591803908348083, 0.9835177659988403, 1.1078550815582275, 1.2321925163269043, 1.356529951095581, 1.4808672666549683, 1.6052045822143555, 1.7295420169830322, 1.853879451751709, 1.9782167673110962, 2.1025540828704834, 2.22689151763916, 2.351228952407837, 2.4755663871765137, 2.5999035835266113, 2.724241018295288, 2.848578453063965, 2.9729156494140625, 3.0972530841827393, 3.221590518951416]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 9.0, 14.0, 17.0, 37.0, 33.0, 33.0, 41.0, 60.0, 69.0, 75.0, 61.0, 79.0, 68.0, 71.0, 74.0, 69.0, 48.0, 35.0, 27.0, 33.0, 22.0, 8.0, 6.0, 4.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35211247205734253, -0.3345228433609009, -0.31693321466445923, -0.2993435859680176, -0.2817539572715759, -0.2641643285751343, -0.24657467007637024, -0.2289850413799286, -0.21139541268348694, -0.1938057839870453, -0.17621615529060364, -0.1586265116930008, -0.14103688299655914, -0.12344725430011749, -0.10585761815309525, -0.088267982006073, -0.07067835330963135, -0.0530887208878994, -0.03549908846616745, -0.0179094560444355, -0.00031982362270355225, 0.017269805073738098, 0.034859441220760345, 0.05244907736778259, 0.07003870606422424, 0.0876283347606659, 0.10521797090768814, 0.12280760705471039, 0.14039723575115204, 0.1579868644475937, 0.17557650804519653, 0.19316613674163818, 0.21075576543807983, 0.22834539413452148, 0.24593502283096313, 0.2635246515274048, 0.28111428022384644, 0.2987039089202881, 0.3162935674190521, 0.3338831961154938, 0.3514728248119354, 0.3690624535083771, 0.3866520822048187, 0.4042417109012604, 0.4218313694000244, 0.43942099809646606, 0.4570106267929077, 0.47460025548934937, 0.492189884185791, 0.5097795128822327, 0.5273691415786743, 0.544958770275116, 0.5625483989715576, 0.5801380276679993, 0.5977276563644409, 0.6153173446655273, 0.6329069137573242, 0.6504965424537659, 0.6680861711502075, 0.6856757998466492, 0.7032654285430908, 0.7208550572395325, 0.7384446859359741, 0.7560343742370605, 0.7736240029335022]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 11.0, 14.0, 6.0, 16.0, 20.0, 34.0, 57.0, 75.0, 84.0, 142.0, 225.0, 349.0, 565.0, 1086.0, 2409.0, 6329.0, 21638.0, 102684.0, 510179.0, 322820.0, 57729.0, 13775.0, 4347.0, 1820.0, 826.0, 485.0, 280.0, 174.0, 97.0, 92.0, 52.0, 40.0, 26.0, 16.0, 14.0, 13.0, 10.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.369873046875, -0.3598289489746094, -0.34978485107421875, -0.3397407531738281, -0.3296966552734375, -0.3196525573730469, -0.30960845947265625, -0.2995643615722656, -0.289520263671875, -0.2794761657714844, -0.26943206787109375, -0.2593879699707031, -0.2493438720703125, -0.23929977416992188, -0.22925567626953125, -0.21921157836914062, -0.20916748046875, -0.19912338256835938, -0.18907928466796875, -0.17903518676757812, -0.1689910888671875, -0.15894699096679688, -0.14890289306640625, -0.13885879516601562, -0.128814697265625, -0.11877059936523438, -0.10872650146484375, -0.09868240356445312, -0.0886383056640625, -0.07859420776367188, -0.06855010986328125, -0.058506011962890625, -0.0484619140625, -0.038417816162109375, -0.02837371826171875, -0.018329620361328125, -0.0082855224609375, 0.001758575439453125, 0.01180267333984375, 0.021846771240234375, 0.031890869140625, 0.041934967041015625, 0.05197906494140625, 0.062023162841796875, 0.0720672607421875, 0.08211135864257812, 0.09215545654296875, 0.10219955444335938, 0.11224365234375, 0.12228775024414062, 0.13233184814453125, 0.14237594604492188, 0.1524200439453125, 0.16246414184570312, 0.17250823974609375, 0.18255233764648438, 0.192596435546875, 0.20264053344726562, 0.21268463134765625, 0.22272872924804688, 0.2327728271484375, 0.24281692504882812, 0.25286102294921875, 0.2629051208496094, 0.27294921875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 5.0, 12.0, 11.0, 10.0, 23.0, 43.0, 43.0, 73.0, 59.0, 77.0, 90.0, 78.0, 94.0, 79.0, 70.0, 68.0, 51.0, 32.0, 22.0, 26.0, 13.0, 9.0, 4.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.08685302734375, -0.08453750610351562, -0.08222198486328125, -0.07990646362304688, -0.0775909423828125, -0.07527542114257812, -0.07295989990234375, -0.07064437866210938, -0.068328857421875, -0.06601333618164062, -0.06369781494140625, -0.061382293701171875, -0.0590667724609375, -0.056751251220703125, -0.05443572998046875, -0.052120208740234375, -0.0498046875, -0.047489166259765625, -0.04517364501953125, -0.042858123779296875, -0.0405426025390625, -0.038227081298828125, -0.03591156005859375, -0.033596038818359375, -0.031280517578125, -0.028964996337890625, -0.02664947509765625, -0.024333953857421875, -0.0220184326171875, -0.019702911376953125, -0.01738739013671875, -0.015071868896484375, -0.01275634765625, -0.010440826416015625, -0.00812530517578125, -0.005809783935546875, -0.0034942626953125, -0.001178741455078125, 0.00113677978515625, 0.003452301025390625, 0.005767822265625, 0.008083343505859375, 0.01039886474609375, 0.012714385986328125, 0.0150299072265625, 0.017345428466796875, 0.01966094970703125, 0.021976470947265625, 0.0242919921875, 0.026607513427734375, 0.02892303466796875, 0.031238555908203125, 0.0335540771484375, 0.035869598388671875, 0.03818511962890625, 0.040500640869140625, 0.042816162109375, 0.045131683349609375, 0.04744720458984375, 0.049762725830078125, 0.0520782470703125, 0.054393768310546875, 0.05670928955078125, 0.059024810791015625, 0.06134033203125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 8.0, 4.0, 16.0, 17.0, 21.0, 36.0, 33.0, 49.0, 74.0, 115.0, 185.0, 303.0, 517.0, 1084.0, 2404.0, 6662.0, 23792.0, 127470.0, 614303.0, 219991.0, 36199.0, 9270.0, 3056.0, 1317.0, 605.0, 353.0, 224.0, 126.0, 103.0, 67.0, 33.0, 19.0, 29.0, 21.0, 21.0, 9.0, 1.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.308837890625, -0.2990760803222656, -0.28931427001953125, -0.2795524597167969, -0.2697906494140625, -0.2600288391113281, -0.25026702880859375, -0.24050521850585938, -0.230743408203125, -0.22098159790039062, -0.21121978759765625, -0.20145797729492188, -0.1916961669921875, -0.18193435668945312, -0.17217254638671875, -0.16241073608398438, -0.15264892578125, -0.14288711547851562, -0.13312530517578125, -0.12336349487304688, -0.1136016845703125, -0.10383987426757812, -0.09407806396484375, -0.08431625366210938, -0.074554443359375, -0.06479263305664062, -0.05503082275390625, -0.045269012451171875, -0.0355072021484375, -0.025745391845703125, -0.01598358154296875, -0.006221771240234375, 0.0035400390625, 0.013301849365234375, 0.02306365966796875, 0.032825469970703125, 0.0425872802734375, 0.052349090576171875, 0.06211090087890625, 0.07187271118164062, 0.081634521484375, 0.09139633178710938, 0.10115814208984375, 0.11091995239257812, 0.1206817626953125, 0.13044357299804688, 0.14020538330078125, 0.14996719360351562, 0.15972900390625, 0.16949081420898438, 0.17925262451171875, 0.18901443481445312, 0.1987762451171875, 0.20853805541992188, 0.21829986572265625, 0.22806167602539062, 0.237823486328125, 0.24758529663085938, 0.25734710693359375, 0.2671089172363281, 0.2768707275390625, 0.2866325378417969, 0.29639434814453125, 0.3061561584472656, 0.31591796875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 6.0, 6.0, 9.0, 8.0, 10.0, 11.0, 17.0, 23.0, 27.0, 19.0, 35.0, 47.0, 22.0, 56.0, 53.0, 51.0, 63.0, 56.0, 64.0, 59.0, 56.0, 46.0, 47.0, 39.0, 32.0, 30.0, 24.0, 13.0, 25.0, 12.0, 11.0, 5.0, 4.0, 8.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.280029296875, -0.2724494934082031, -0.26486968994140625, -0.2572898864746094, -0.2497100830078125, -0.24213027954101562, -0.23455047607421875, -0.22697067260742188, -0.219390869140625, -0.21181106567382812, -0.20423126220703125, -0.19665145874023438, -0.1890716552734375, -0.18149185180664062, -0.17391204833984375, -0.16633224487304688, -0.15875244140625, -0.15117263793945312, -0.14359283447265625, -0.13601303100585938, -0.1284332275390625, -0.12085342407226562, -0.11327362060546875, -0.10569381713867188, -0.098114013671875, -0.09053421020507812, -0.08295440673828125, -0.07537460327148438, -0.0677947998046875, -0.060214996337890625, -0.05263519287109375, -0.045055389404296875, -0.0374755859375, -0.029895782470703125, -0.02231597900390625, -0.014736175537109375, -0.0071563720703125, 0.000423431396484375, 0.00800323486328125, 0.015583038330078125, 0.023162841796875, 0.030742645263671875, 0.03832244873046875, 0.045902252197265625, 0.0534820556640625, 0.061061859130859375, 0.06864166259765625, 0.07622146606445312, 0.08380126953125, 0.09138107299804688, 0.09896087646484375, 0.10654067993164062, 0.1141204833984375, 0.12170028686523438, 0.12928009033203125, 0.13685989379882812, 0.144439697265625, 0.15201950073242188, 0.15959930419921875, 0.16717910766601562, 0.1747589111328125, 0.18233871459960938, 0.18991851806640625, 0.19749832153320312, 0.205078125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 5.0, 7.0, 11.0, 9.0, 22.0, 17.0, 31.0, 44.0, 104.0, 175.0, 409.0, 1170.0, 3877.0, 20875.0, 360152.0, 623211.0, 30908.0, 5112.0, 1391.0, 544.0, 201.0, 108.0, 61.0, 40.0, 28.0, 11.0, 11.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.183837890625, -0.17679214477539062, -0.16974639892578125, -0.16270065307617188, -0.1556549072265625, -0.14860916137695312, -0.14156341552734375, -0.13451766967773438, -0.127471923828125, -0.12042617797851562, -0.11338043212890625, -0.10633468627929688, -0.0992889404296875, -0.09224319458007812, -0.08519744873046875, -0.07815170288085938, -0.07110595703125, -0.06406021118164062, -0.05701446533203125, -0.049968719482421875, -0.0429229736328125, -0.035877227783203125, -0.02883148193359375, -0.021785736083984375, -0.014739990234375, -0.007694244384765625, -0.00064849853515625, 0.006397247314453125, 0.0134429931640625, 0.020488739013671875, 0.02753448486328125, 0.034580230712890625, 0.0416259765625, 0.048671722412109375, 0.05571746826171875, 0.06276321411132812, 0.0698089599609375, 0.07685470581054688, 0.08390045166015625, 0.09094619750976562, 0.097991943359375, 0.10503768920898438, 0.11208343505859375, 0.11912918090820312, 0.1261749267578125, 0.13322067260742188, 0.14026641845703125, 0.14731216430664062, 0.15435791015625, 0.16140365600585938, 0.16844940185546875, 0.17549514770507812, 0.1825408935546875, 0.18958663940429688, 0.19663238525390625, 0.20367813110351562, 0.210723876953125, 0.21776962280273438, 0.22481536865234375, 0.23186111450195312, 0.2389068603515625, 0.24595260620117188, 0.25299835205078125, 0.2600440979003906, 0.26708984375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 9.0, 4.0, 11.0, 11.0, 20.0, 30.0, 45.0, 61.0, 104.0, 148.0, 168.0, 126.0, 102.0, 62.0, 34.0, 32.0, 21.0, 9.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.202127456665039e-05, -4.107598215341568e-05, -4.013068974018097e-05, -3.918539732694626e-05, -3.824010491371155e-05, -3.729481250047684e-05, -3.6349520087242126e-05, -3.5404227674007416e-05, -3.4458935260772705e-05, -3.3513642847537994e-05, -3.2568350434303284e-05, -3.162305802106857e-05, -3.067776560783386e-05, -2.973247319459915e-05, -2.878718078136444e-05, -2.784188836812973e-05, -2.689659595489502e-05, -2.595130354166031e-05, -2.5006011128425598e-05, -2.4060718715190887e-05, -2.3115426301956177e-05, -2.2170133888721466e-05, -2.1224841475486755e-05, -2.0279549062252045e-05, -1.9334256649017334e-05, -1.8388964235782623e-05, -1.7443671822547913e-05, -1.6498379409313202e-05, -1.555308699607849e-05, -1.460779458284378e-05, -1.366250216960907e-05, -1.2717209756374359e-05, -1.1771917343139648e-05, -1.0826624929904938e-05, -9.881332516670227e-06, -8.936040103435516e-06, -7.990747690200806e-06, -7.045455276966095e-06, -6.100162863731384e-06, -5.154870450496674e-06, -4.209578037261963e-06, -3.264285624027252e-06, -2.3189932107925415e-06, -1.3737007975578308e-06, -4.284083843231201e-07, 5.168840289115906e-07, 1.4621764421463013e-06, 2.407468855381012e-06, 3.3527612686157227e-06, 4.298053681850433e-06, 5.243346095085144e-06, 6.188638508319855e-06, 7.1339309215545654e-06, 8.079223334789276e-06, 9.024515748023987e-06, 9.969808161258698e-06, 1.0915100574493408e-05, 1.1860392987728119e-05, 1.280568540096283e-05, 1.375097781419754e-05, 1.4696270227432251e-05, 1.564156264066696e-05, 1.6586855053901672e-05, 1.7532147467136383e-05, 1.8477439880371094e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 3.0, 15.0, 5.0, 22.0, 40.0, 42.0, 84.0, 115.0, 183.0, 334.0, 650.0, 1296.0, 2972.0, 9266.0, 50819.0, 724554.0, 226985.0, 21789.0, 5367.0, 1946.0, 929.0, 461.0, 257.0, 136.0, 94.0, 65.0, 32.0, 30.0, 12.0, 11.0, 7.0, 6.0, 3.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17626953125, -0.16915512084960938, -0.16204071044921875, -0.15492630004882812, -0.1478118896484375, -0.14069747924804688, -0.13358306884765625, -0.12646865844726562, -0.119354248046875, -0.11223983764648438, -0.10512542724609375, -0.09801101684570312, -0.0908966064453125, -0.08378219604492188, -0.07666778564453125, -0.06955337524414062, -0.06243896484375, -0.055324554443359375, -0.04821014404296875, -0.041095733642578125, -0.0339813232421875, -0.026866912841796875, -0.01975250244140625, -0.012638092041015625, -0.005523681640625, 0.001590728759765625, 0.00870513916015625, 0.015819549560546875, 0.0229339599609375, 0.030048370361328125, 0.03716278076171875, 0.044277191162109375, 0.0513916015625, 0.058506011962890625, 0.06562042236328125, 0.07273483276367188, 0.0798492431640625, 0.08696365356445312, 0.09407806396484375, 0.10119247436523438, 0.108306884765625, 0.11542129516601562, 0.12253570556640625, 0.12965011596679688, 0.1367645263671875, 0.14387893676757812, 0.15099334716796875, 0.15810775756835938, 0.16522216796875, 0.17233657836914062, 0.17945098876953125, 0.18656539916992188, 0.1936798095703125, 0.20079421997070312, 0.20790863037109375, 0.21502304077148438, 0.222137451171875, 0.22925186157226562, 0.23636627197265625, 0.24348068237304688, 0.2505950927734375, 0.2577095031738281, 0.26482391357421875, 0.2719383239746094, 0.279052734375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 8.0, 9.0, 9.0, 25.0, 25.0, 35.0, 48.0, 58.0, 103.0, 129.0, 127.0, 108.0, 95.0, 65.0, 53.0, 37.0, 19.0, 18.0, 5.0, 6.0, 4.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09332275390625, -0.08874034881591797, -0.08415794372558594, -0.0795755386352539, -0.07499313354492188, -0.07041072845458984, -0.06582832336425781, -0.06124591827392578, -0.05666351318359375, -0.05208110809326172, -0.04749870300292969, -0.042916297912597656, -0.038333892822265625, -0.033751487731933594, -0.029169082641601562, -0.02458667755126953, -0.0200042724609375, -0.015421867370605469, -0.010839462280273438, -0.006257057189941406, -0.001674652099609375, 0.0029077529907226562, 0.0074901580810546875, 0.012072563171386719, 0.01665496826171875, 0.02123737335205078, 0.025819778442382812, 0.030402183532714844, 0.034984588623046875, 0.039566993713378906, 0.04414939880371094, 0.04873180389404297, 0.053314208984375, 0.05789661407470703, 0.06247901916503906, 0.0670614242553711, 0.07164382934570312, 0.07622623443603516, 0.08080863952636719, 0.08539104461669922, 0.08997344970703125, 0.09455585479736328, 0.09913825988769531, 0.10372066497802734, 0.10830307006835938, 0.1128854751586914, 0.11746788024902344, 0.12205028533935547, 0.1266326904296875, 0.13121509552001953, 0.13579750061035156, 0.1403799057006836, 0.14496231079101562, 0.14954471588134766, 0.1541271209716797, 0.15870952606201172, 0.16329193115234375, 0.16787433624267578, 0.1724567413330078, 0.17703914642333984, 0.18162155151367188, 0.1862039566040039, 0.19078636169433594, 0.19536876678466797, 0.199951171875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 10.0, 36.0, 164.0, 513.0, 243.0, 32.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.200401306152344, -8.024381637573242, -7.848361492156982, -7.672341823577881, -7.496322154998779, -7.3203020095825195, -7.144282341003418, -6.968262672424316, -6.792243003845215, -6.616223335266113, -6.4402031898498535, -6.264183521270752, -6.08816385269165, -5.912143707275391, -5.736124038696289, -5.5601043701171875, -5.384084224700928, -5.208064556121826, -5.032044410705566, -4.856024742126465, -4.680005073547363, -4.503985404968262, -4.327965259552002, -4.1519455909729, -3.9759256839752197, -3.799905776977539, -3.6238861083984375, -3.447866201400757, -3.271846294403076, -3.0958266258239746, -2.919806718826294, -2.7437868118286133, -2.56776762008667, -2.3917477130889893, -2.2157280445098877, -2.039708137512207, -1.863688349723816, -1.6876685619354248, -1.5116486549377441, -1.335628867149353, -1.159609079360962, -0.9835892915725708, -0.8075694441795349, -0.631549596786499, -0.4555298089981079, -0.2795100212097168, -0.10349011421203613, 0.07252967357635498, 0.2485494613647461, 0.4245692789554596, 0.6005890965461731, 0.776608943939209, 0.9526287317276001, 1.1286485195159912, 1.3046684265136719, 1.480688214302063, 1.656708002090454, 1.8327277898788452, 2.0087475776672363, 2.184767484664917, 2.3607873916625977, 2.536807060241699, 2.71282696723938, 2.8888468742370605, 3.064866542816162]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 6.0, 3.0, 7.0, 9.0, 19.0, 10.0, 14.0, 17.0, 15.0, 29.0, 23.0, 26.0, 34.0, 25.0, 43.0, 41.0, 45.0, 40.0, 45.0, 53.0, 47.0, 53.0, 60.0, 35.0, 46.0, 35.0, 36.0, 26.0, 36.0, 28.0, 15.0, 14.0, 17.0, 5.0, 14.0, 5.0, 6.0, 4.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9388344287872314, -0.9024601578712463, -0.8660858869552612, -0.8297115564346313, -0.7933372855186462, -0.7569630146026611, -0.7205886840820312, -0.6842144131660461, -0.647840142250061, -0.6114658713340759, -0.5750916004180908, -0.5387172698974609, -0.5023429989814758, -0.4659687280654907, -0.4295944273471832, -0.39322012662887573, -0.3568458557128906, -0.3204715847969055, -0.284097284078598, -0.24772299826145172, -0.21134871244430542, -0.17497442662715912, -0.13860014081001282, -0.10222584009170532, -0.06585156917572021, -0.029477283358573914, 0.006897002458572388, 0.04327128827571869, 0.07964557409286499, 0.11601985991001129, 0.1523941457271576, 0.1887684464454651, 0.22514259815216064, 0.26151686906814575, 0.29789116978645325, 0.33426547050476074, 0.37063974142074585, 0.40701401233673096, 0.44338831305503845, 0.47976261377334595, 0.516136884689331, 0.5525111556053162, 0.5888854265213013, 0.6252597570419312, 0.6616340279579163, 0.6980082988739014, 0.7343826293945312, 0.7707569003105164, 0.8071311712265015, 0.8435054421424866, 0.8798797130584717, 0.9162540435791016, 0.9526283144950867, 0.9890025854110718, 1.0253769159317017, 1.061751127243042, 1.0981254577636719, 1.1344997882843018, 1.170873999595642, 1.207248330116272, 1.2436225414276123, 1.2799968719482422, 1.316371202468872, 1.352745532989502, 1.3891197443008423]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 11.0, 9.0, 12.0, 18.0, 26.0, 26.0, 50.0, 52.0, 69.0, 140.0, 175.0, 313.0, 534.0, 1031.0, 2229.0, 5813.0, 20189.0, 160360.0, 3892401.0, 86044.0, 15755.0, 5075.0, 1982.0, 910.0, 464.0, 221.0, 141.0, 81.0, 42.0, 31.0, 13.0, 13.0, 6.0, 12.0, 5.0, 0.0, 4.0, 2.0, 3.0, 0.0, 4.0], "bins": [-0.7197265625, -0.7023391723632812, -0.6849517822265625, -0.6675643920898438, -0.650177001953125, -0.6327896118164062, -0.6154022216796875, -0.5980148315429688, -0.58062744140625, -0.5632400512695312, -0.5458526611328125, -0.5284652709960938, -0.511077880859375, -0.49369049072265625, -0.4763031005859375, -0.45891571044921875, -0.4415283203125, -0.42414093017578125, -0.4067535400390625, -0.38936614990234375, -0.371978759765625, -0.35459136962890625, -0.3372039794921875, -0.31981658935546875, -0.30242919921875, -0.28504180908203125, -0.2676544189453125, -0.25026702880859375, -0.232879638671875, -0.21549224853515625, -0.1981048583984375, -0.18071746826171875, -0.163330078125, -0.14594268798828125, -0.1285552978515625, -0.11116790771484375, -0.093780517578125, -0.07639312744140625, -0.0590057373046875, -0.04161834716796875, -0.02423095703125, -0.00684356689453125, 0.0105438232421875, 0.02793121337890625, 0.045318603515625, 0.06270599365234375, 0.0800933837890625, 0.09748077392578125, 0.1148681640625, 0.13225555419921875, 0.1496429443359375, 0.16703033447265625, 0.184417724609375, 0.20180511474609375, 0.2191925048828125, 0.23657989501953125, 0.25396728515625, 0.27135467529296875, 0.2887420654296875, 0.30612945556640625, 0.323516845703125, 0.34090423583984375, 0.3582916259765625, 0.37567901611328125, 0.39306640625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 1.0, 7.0, 8.0, 9.0, 19.0, 35.0, 41.0, 34.0, 63.0, 81.0, 87.0, 86.0, 82.0, 73.0, 84.0, 74.0, 48.0, 46.0, 35.0, 26.0, 25.0, 12.0, 5.0, 9.0, 6.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08294677734375, -0.08072853088378906, -0.07851028442382812, -0.07629203796386719, -0.07407379150390625, -0.07185554504394531, -0.06963729858398438, -0.06741905212402344, -0.0652008056640625, -0.06298255920410156, -0.060764312744140625, -0.05854606628417969, -0.05632781982421875, -0.05410957336425781, -0.051891326904296875, -0.04967308044433594, -0.047454833984375, -0.04523658752441406, -0.043018341064453125, -0.04080009460449219, -0.03858184814453125, -0.03636360168457031, -0.034145355224609375, -0.03192710876464844, -0.0297088623046875, -0.027490615844726562, -0.025272369384765625, -0.023054122924804688, -0.02083587646484375, -0.018617630004882812, -0.016399383544921875, -0.014181137084960938, -0.011962890625, -0.009744644165039062, -0.007526397705078125, -0.0053081512451171875, -0.00308990478515625, -0.0008716583251953125, 0.001346588134765625, 0.0035648345947265625, 0.0057830810546875, 0.008001327514648438, 0.010219573974609375, 0.012437820434570312, 0.01465606689453125, 0.016874313354492188, 0.019092559814453125, 0.021310806274414062, 0.023529052734375, 0.025747299194335938, 0.027965545654296875, 0.030183792114257812, 0.03240203857421875, 0.03462028503417969, 0.036838531494140625, 0.03905677795410156, 0.0412750244140625, 0.04349327087402344, 0.045711517333984375, 0.04792976379394531, 0.05014801025390625, 0.05236625671386719, 0.054584503173828125, 0.05680274963378906, 0.05902099609375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 11.0, 11.0, 18.0, 28.0, 45.0, 88.0, 174.0, 537.0, 2815.0, 69000.0, 4110898.0, 9103.0, 1006.0, 274.0, 117.0, 72.0, 35.0, 23.0, 14.0, 11.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2578125, -1.195709228515625, -1.13360595703125, -1.071502685546875, -1.0093994140625, -0.947296142578125, -0.88519287109375, -0.823089599609375, -0.760986328125, -0.698883056640625, -0.63677978515625, -0.574676513671875, -0.5125732421875, -0.450469970703125, -0.38836669921875, -0.326263427734375, -0.26416015625, -0.202056884765625, -0.13995361328125, -0.077850341796875, -0.0157470703125, 0.046356201171875, 0.10845947265625, 0.170562744140625, 0.232666015625, 0.294769287109375, 0.35687255859375, 0.418975830078125, 0.4810791015625, 0.543182373046875, 0.60528564453125, 0.667388916015625, 0.7294921875, 0.791595458984375, 0.85369873046875, 0.915802001953125, 0.9779052734375, 1.040008544921875, 1.10211181640625, 1.164215087890625, 1.226318359375, 1.288421630859375, 1.35052490234375, 1.412628173828125, 1.4747314453125, 1.536834716796875, 1.59893798828125, 1.661041259765625, 1.72314453125, 1.785247802734375, 1.84735107421875, 1.909454345703125, 1.9715576171875, 2.033660888671875, 2.09576416015625, 2.157867431640625, 2.219970703125, 2.282073974609375, 2.34417724609375, 2.406280517578125, 2.4683837890625, 2.530487060546875, 2.59259033203125, 2.654693603515625, 2.716796875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 7.0, 13.0, 17.0, 28.0, 70.0, 157.0, 1721.0, 1722.0, 187.0, 76.0, 36.0, 17.0, 13.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18505859375, -0.1741790771484375, -0.163299560546875, -0.1524200439453125, -0.14154052734375, -0.1306610107421875, -0.119781494140625, -0.1089019775390625, -0.0980224609375, -0.0871429443359375, -0.076263427734375, -0.0653839111328125, -0.05450439453125, -0.0436248779296875, -0.032745361328125, -0.0218658447265625, -0.010986328125, -0.0001068115234375, 0.010772705078125, 0.0216522216796875, 0.03253173828125, 0.0434112548828125, 0.054290771484375, 0.0651702880859375, 0.0760498046875, 0.0869293212890625, 0.097808837890625, 0.1086883544921875, 0.11956787109375, 0.1304473876953125, 0.141326904296875, 0.1522064208984375, 0.1630859375, 0.1739654541015625, 0.184844970703125, 0.1957244873046875, 0.20660400390625, 0.2174835205078125, 0.228363037109375, 0.2392425537109375, 0.2501220703125, 0.2610015869140625, 0.271881103515625, 0.2827606201171875, 0.29364013671875, 0.3045196533203125, 0.315399169921875, 0.3262786865234375, 0.337158203125, 0.3480377197265625, 0.358917236328125, 0.3697967529296875, 0.38067626953125, 0.3915557861328125, 0.402435302734375, 0.4133148193359375, 0.4241943359375, 0.4350738525390625, 0.445953369140625, 0.4568328857421875, 0.46771240234375, 0.4785919189453125, 0.489471435546875, 0.5003509521484375, 0.51123046875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 10.0, 42.0, 302.0, 553.0, 83.0, 12.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.904731273651123, -4.761394500732422, -4.618057727813721, -4.474721431732178, -4.331384658813477, -4.188047885894775, -4.044711112976074, -3.901374340057373, -3.758037805557251, -3.61470103263855, -3.4713644981384277, -3.3280277252197266, -3.1846909523010254, -3.0413544178009033, -2.898017644882202, -2.75468111038208, -2.611344337463379, -2.4680075645446777, -2.3246710300445557, -2.1813342571258545, -2.0379977226257324, -1.8946609497070312, -1.75132417678833, -1.6079875230789185, -1.4646508693695068, -1.3213142156600952, -1.1779775619506836, -1.0346407890319824, -0.8913041353225708, -0.7479674816131592, -0.6046307682991028, -0.4612940549850464, -0.31795787811279297, -0.17462119460105896, -0.03128451108932495, 0.11205217242240906, 0.25538885593414307, 0.3987255096435547, 0.5420622229576111, 0.6853989362716675, 0.8287355899810791, 0.9720722436904907, 1.1154088973999023, 1.2587456703186035, 1.4020823240280151, 1.5454189777374268, 1.688755750656128, 1.8320924043655396, 1.9754290580749512, 2.1187658309936523, 2.2621023654937744, 2.4054391384124756, 2.5487756729125977, 2.692112445831299, 2.83544921875, 2.978785991668701, 3.1221225261688232, 3.2654592990875244, 3.4087958335876465, 3.5521326065063477, 3.695469379425049, 3.838805913925171, 3.982142686843872, 4.125479221343994, 4.268815994262695]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 10.0, 12.0, 22.0, 30.0, 32.0, 47.0, 37.0, 73.0, 66.0, 77.0, 74.0, 83.0, 79.0, 72.0, 67.0, 59.0, 48.0, 30.0, 23.0, 16.0, 16.0, 11.0, 8.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.800968587398529, -0.7737975120544434, -0.7466264367103577, -0.719455361366272, -0.6922842264175415, -0.6651132106781006, -0.6379420757293701, -0.6107710003852844, -0.5835999250411987, -0.556428849697113, -0.5292577743530273, -0.5020866990089417, -0.47491559386253357, -0.4477445185184479, -0.4205734133720398, -0.3934023380279541, -0.3662312626838684, -0.3390601873397827, -0.311889111995697, -0.28471800684928894, -0.25754693150520325, -0.23037585616111755, -0.20320476591587067, -0.17603367567062378, -0.14886260032653809, -0.1216915175318718, -0.0945204347372055, -0.06734935194253922, -0.040178269147872925, -0.013007193803787231, 0.014163896441459656, 0.04133498668670654, 0.06850606203079224, 0.09567714482545853, 0.12284822762012482, 0.1500193178653717, 0.1771903932094574, 0.2043614685535431, 0.23153255879878998, 0.25870364904403687, 0.28587472438812256, 0.31304579973220825, 0.34021687507629395, 0.367387980222702, 0.3945590555667877, 0.4217301309108734, 0.4489012360572815, 0.4760723114013672, 0.5032433867454529, 0.5304144620895386, 0.5575855374336243, 0.58475661277771, 0.6119277477264404, 0.6390987634658813, 0.6662698984146118, 0.6934409737586975, 0.7206120491027832, 0.7477831244468689, 0.7749541997909546, 0.8021252751350403, 0.829296350479126, 0.8564674854278564, 0.8836385607719421, 0.9108096361160278, 0.9379807114601135]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 11.0, 13.0, 25.0, 25.0, 33.0, 59.0, 77.0, 123.0, 190.0, 344.0, 637.0, 1166.0, 2713.0, 8013.0, 40709.0, 322460.0, 569450.0, 81645.0, 13581.0, 3778.0, 1610.0, 750.0, 418.0, 260.0, 161.0, 80.0, 59.0, 48.0, 28.0, 24.0, 12.0, 12.0, 12.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3837890625, -0.370635986328125, -0.35748291015625, -0.344329833984375, -0.3311767578125, -0.318023681640625, -0.30487060546875, -0.291717529296875, -0.278564453125, -0.265411376953125, -0.25225830078125, -0.239105224609375, -0.2259521484375, -0.212799072265625, -0.19964599609375, -0.186492919921875, -0.17333984375, -0.160186767578125, -0.14703369140625, -0.133880615234375, -0.1207275390625, -0.107574462890625, -0.09442138671875, -0.081268310546875, -0.068115234375, -0.054962158203125, -0.04180908203125, -0.028656005859375, -0.0155029296875, -0.002349853515625, 0.01080322265625, 0.023956298828125, 0.037109375, 0.050262451171875, 0.06341552734375, 0.076568603515625, 0.0897216796875, 0.102874755859375, 0.11602783203125, 0.129180908203125, 0.142333984375, 0.155487060546875, 0.16864013671875, 0.181793212890625, 0.1949462890625, 0.208099365234375, 0.22125244140625, 0.234405517578125, 0.24755859375, 0.260711669921875, 0.27386474609375, 0.287017822265625, 0.3001708984375, 0.313323974609375, 0.32647705078125, 0.339630126953125, 0.352783203125, 0.365936279296875, 0.37908935546875, 0.392242431640625, 0.4053955078125, 0.418548583984375, 0.43170166015625, 0.444854736328125, 0.4580078125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 3.0, 2.0, 8.0, 5.0, 11.0, 16.0, 32.0, 46.0, 53.0, 65.0, 71.0, 87.0, 108.0, 92.0, 85.0, 64.0, 74.0, 57.0, 40.0, 23.0, 23.0, 9.0, 9.0, 8.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1060791015625, -0.1035466194152832, -0.1010141372680664, -0.09848165512084961, -0.09594917297363281, -0.09341669082641602, -0.09088420867919922, -0.08835172653198242, -0.08581924438476562, -0.08328676223754883, -0.08075428009033203, -0.07822179794311523, -0.07568931579589844, -0.07315683364868164, -0.07062435150146484, -0.06809186935424805, -0.06555938720703125, -0.06302690505981445, -0.060494422912597656, -0.05796194076538086, -0.05542945861816406, -0.052896976470947266, -0.05036449432373047, -0.04783201217651367, -0.045299530029296875, -0.04276704788208008, -0.04023456573486328, -0.037702083587646484, -0.03516960144042969, -0.03263711929321289, -0.030104637145996094, -0.027572154998779297, -0.0250396728515625, -0.022507190704345703, -0.019974708557128906, -0.01744222640991211, -0.014909744262695312, -0.012377262115478516, -0.009844779968261719, -0.007312297821044922, -0.004779815673828125, -0.002247333526611328, 0.00028514862060546875, 0.0028176307678222656, 0.0053501129150390625, 0.00788259506225586, 0.010415077209472656, 0.012947559356689453, 0.01548004150390625, 0.018012523651123047, 0.020545005798339844, 0.02307748794555664, 0.025609970092773438, 0.028142452239990234, 0.03067493438720703, 0.03320741653442383, 0.035739898681640625, 0.03827238082885742, 0.04080486297607422, 0.043337345123291016, 0.04586982727050781, 0.04840230941772461, 0.050934791564941406, 0.0534672737121582, 0.055999755859375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 2.0, 2.0, 5.0, 10.0, 6.0, 9.0, 13.0, 12.0, 18.0, 24.0, 26.0, 45.0, 72.0, 119.0, 293.0, 629.0, 1703.0, 5105.0, 17751.0, 75906.0, 361024.0, 448504.0, 103952.0, 23440.0, 6355.0, 2034.0, 793.0, 315.0, 147.0, 68.0, 43.0, 26.0, 22.0, 14.0, 10.0, 9.0, 9.0, 6.0, 2.0, 7.0, 2.0, 5.0, 6.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.22802734375, -0.22045135498046875, -0.2128753662109375, -0.20529937744140625, -0.197723388671875, -0.19014739990234375, -0.1825714111328125, -0.17499542236328125, -0.16741943359375, -0.15984344482421875, -0.1522674560546875, -0.14469146728515625, -0.137115478515625, -0.12953948974609375, -0.1219635009765625, -0.11438751220703125, -0.1068115234375, -0.09923553466796875, -0.0916595458984375, -0.08408355712890625, -0.076507568359375, -0.06893157958984375, -0.0613555908203125, -0.05377960205078125, -0.04620361328125, -0.03862762451171875, -0.0310516357421875, -0.02347564697265625, -0.015899658203125, -0.00832366943359375, -0.0007476806640625, 0.00682830810546875, 0.014404296875, 0.02198028564453125, 0.0295562744140625, 0.03713226318359375, 0.044708251953125, 0.05228424072265625, 0.0598602294921875, 0.06743621826171875, 0.07501220703125, 0.08258819580078125, 0.0901641845703125, 0.09774017333984375, 0.105316162109375, 0.11289215087890625, 0.1204681396484375, 0.12804412841796875, 0.1356201171875, 0.14319610595703125, 0.1507720947265625, 0.15834808349609375, 0.165924072265625, 0.17350006103515625, 0.1810760498046875, 0.18865203857421875, 0.19622802734375, 0.20380401611328125, 0.2113800048828125, 0.21895599365234375, 0.226531982421875, 0.23410797119140625, 0.2416839599609375, 0.24925994873046875, 0.2568359375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 8.0, 6.0, 5.0, 12.0, 12.0, 11.0, 15.0, 14.0, 28.0, 19.0, 33.0, 36.0, 31.0, 48.0, 39.0, 46.0, 53.0, 49.0, 60.0, 36.0, 46.0, 45.0, 42.0, 40.0, 43.0, 34.0, 35.0, 34.0, 24.0, 18.0, 16.0, 12.0, 13.0, 7.0, 3.0, 7.0, 5.0, 3.0, 4.0, 6.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.168701171875, -0.1628398895263672, -0.15697860717773438, -0.15111732482910156, -0.14525604248046875, -0.13939476013183594, -0.13353347778320312, -0.1276721954345703, -0.1218109130859375, -0.11594963073730469, -0.11008834838867188, -0.10422706604003906, -0.09836578369140625, -0.09250450134277344, -0.08664321899414062, -0.08078193664550781, -0.074920654296875, -0.06905937194824219, -0.06319808959960938, -0.05733680725097656, -0.05147552490234375, -0.04561424255371094, -0.039752960205078125, -0.03389167785644531, -0.0280303955078125, -0.022169113159179688, -0.016307830810546875, -0.010446548461914062, -0.00458526611328125, 0.0012760162353515625, 0.007137298583984375, 0.012998580932617188, 0.01885986328125, 0.024721145629882812, 0.030582427978515625, 0.03644371032714844, 0.04230499267578125, 0.04816627502441406, 0.054027557373046875, 0.05988883972167969, 0.0657501220703125, 0.07161140441894531, 0.07747268676757812, 0.08333396911621094, 0.08919525146484375, 0.09505653381347656, 0.10091781616210938, 0.10677909851074219, 0.112640380859375, 0.11850166320800781, 0.12436294555664062, 0.13022422790527344, 0.13608551025390625, 0.14194679260253906, 0.14780807495117188, 0.1536693572998047, 0.1595306396484375, 0.1653919219970703, 0.17125320434570312, 0.17711448669433594, 0.18297576904296875, 0.18883705139160156, 0.19469833374023438, 0.2005596160888672, 0.2064208984375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 4.0, 6.0, 20.0, 15.0, 30.0, 50.0, 84.0, 197.0, 521.0, 1681.0, 5959.0, 29032.0, 247890.0, 650519.0, 93020.0, 14493.0, 3382.0, 993.0, 317.0, 141.0, 59.0, 41.0, 17.0, 14.0, 14.0, 12.0, 9.0, 6.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.144287109375, -0.14007949829101562, -0.13587188720703125, -0.13166427612304688, -0.1274566650390625, -0.12324905395507812, -0.11904144287109375, -0.11483383178710938, -0.110626220703125, -0.10641860961914062, -0.10221099853515625, -0.09800338745117188, -0.0937957763671875, -0.08958816528320312, -0.08538055419921875, -0.08117294311523438, -0.07696533203125, -0.07275772094726562, -0.06855010986328125, -0.06434249877929688, -0.0601348876953125, -0.055927276611328125, -0.05171966552734375, -0.047512054443359375, -0.043304443359375, -0.039096832275390625, -0.03488922119140625, -0.030681610107421875, -0.0264739990234375, -0.022266387939453125, -0.01805877685546875, -0.013851165771484375, -0.0096435546875, -0.005435943603515625, -0.00122833251953125, 0.002979278564453125, 0.0071868896484375, 0.011394500732421875, 0.01560211181640625, 0.019809722900390625, 0.024017333984375, 0.028224945068359375, 0.03243255615234375, 0.036640167236328125, 0.0408477783203125, 0.045055389404296875, 0.04926300048828125, 0.053470611572265625, 0.05767822265625, 0.061885833740234375, 0.06609344482421875, 0.07030105590820312, 0.0745086669921875, 0.07871627807617188, 0.08292388916015625, 0.08713150024414062, 0.091339111328125, 0.09554672241210938, 0.09975433349609375, 0.10396194458007812, 0.1081695556640625, 0.11237716674804688, 0.11658477783203125, 0.12079238891601562, 0.125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 5.0, 3.0, 10.0, 11.0, 9.0, 11.0, 13.0, 23.0, 26.0, 28.0, 45.0, 47.0, 66.0, 63.0, 64.0, 74.0, 75.0, 57.0, 63.0, 63.0, 50.0, 45.0, 37.0, 16.0, 16.0, 15.0, 11.0, 12.0, 8.0, 8.0, 8.0, 4.0, 4.0, 2.0, 4.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3768672943115234e-05, -1.3364478945732117e-05, -1.2960284948348999e-05, -1.2556090950965881e-05, -1.2151896953582764e-05, -1.1747702956199646e-05, -1.1343508958816528e-05, -1.093931496143341e-05, -1.0535120964050293e-05, -1.0130926966667175e-05, -9.726732969284058e-06, -9.32253897190094e-06, -8.918344974517822e-06, -8.514150977134705e-06, -8.109956979751587e-06, -7.70576298236847e-06, -7.3015689849853516e-06, -6.897374987602234e-06, -6.493180990219116e-06, -6.0889869928359985e-06, -5.684792995452881e-06, -5.280598998069763e-06, -4.8764050006866455e-06, -4.472211003303528e-06, -4.06801700592041e-06, -3.6638230085372925e-06, -3.259629011154175e-06, -2.855435013771057e-06, -2.4512410163879395e-06, -2.0470470190048218e-06, -1.642853021621704e-06, -1.2386590242385864e-06, -8.344650268554688e-07, -4.302710294723511e-07, -2.60770320892334e-08, 3.781169652938843e-07, 7.82310962677002e-07, 1.1865049600601196e-06, 1.5906989574432373e-06, 1.994892954826355e-06, 2.3990869522094727e-06, 2.8032809495925903e-06, 3.207474946975708e-06, 3.6116689443588257e-06, 4.015862941741943e-06, 4.420056939125061e-06, 4.824250936508179e-06, 5.228444933891296e-06, 5.632638931274414e-06, 6.036832928657532e-06, 6.441026926040649e-06, 6.845220923423767e-06, 7.249414920806885e-06, 7.653608918190002e-06, 8.05780291557312e-06, 8.461996912956238e-06, 8.866190910339355e-06, 9.270384907722473e-06, 9.67457890510559e-06, 1.0078772902488708e-05, 1.0482966899871826e-05, 1.0887160897254944e-05, 1.1291354894638062e-05, 1.169554889202118e-05, 1.2099742889404297e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 11.0, 15.0, 22.0, 41.0, 48.0, 80.0, 205.0, 376.0, 873.0, 2160.0, 6910.0, 27848.0, 173157.0, 650181.0, 151148.0, 25338.0, 6405.0, 2124.0, 826.0, 383.0, 154.0, 102.0, 44.0, 25.0, 15.0, 20.0, 7.0, 7.0, 3.0, 2.0, 7.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.148681640625, -0.14448928833007812, -0.14029693603515625, -0.13610458374023438, -0.1319122314453125, -0.12771987915039062, -0.12352752685546875, -0.11933517456054688, -0.115142822265625, -0.11095046997070312, -0.10675811767578125, -0.10256576538085938, -0.0983734130859375, -0.09418106079101562, -0.08998870849609375, -0.08579635620117188, -0.08160400390625, -0.07741165161132812, -0.07321929931640625, -0.06902694702148438, -0.0648345947265625, -0.060642242431640625, -0.05644989013671875, -0.052257537841796875, -0.048065185546875, -0.043872833251953125, -0.03968048095703125, -0.035488128662109375, -0.0312957763671875, -0.027103424072265625, -0.02291107177734375, -0.018718719482421875, -0.0145263671875, -0.010334014892578125, -0.00614166259765625, -0.001949310302734375, 0.0022430419921875, 0.006435394287109375, 0.01062774658203125, 0.014820098876953125, 0.019012451171875, 0.023204803466796875, 0.02739715576171875, 0.031589508056640625, 0.0357818603515625, 0.039974212646484375, 0.04416656494140625, 0.048358917236328125, 0.05255126953125, 0.056743621826171875, 0.06093597412109375, 0.06512832641601562, 0.0693206787109375, 0.07351303100585938, 0.07770538330078125, 0.08189773559570312, 0.086090087890625, 0.09028244018554688, 0.09447479248046875, 0.09866714477539062, 0.1028594970703125, 0.10705184936523438, 0.11124420166015625, 0.11543655395507812, 0.11962890625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 3.0, 2.0, 0.0, 5.0, 3.0, 7.0, 6.0, 14.0, 8.0, 13.0, 16.0, 20.0, 17.0, 30.0, 37.0, 36.0, 38.0, 53.0, 66.0, 77.0, 65.0, 64.0, 80.0, 52.0, 51.0, 45.0, 35.0, 39.0, 27.0, 14.0, 17.0, 19.0, 13.0, 10.0, 7.0, 3.0, 3.0, 5.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.068115234375, -0.06585979461669922, -0.06360435485839844, -0.061348915100097656, -0.059093475341796875, -0.056838035583496094, -0.05458259582519531, -0.05232715606689453, -0.05007171630859375, -0.04781627655029297, -0.04556083679199219, -0.043305397033691406, -0.041049957275390625, -0.038794517517089844, -0.03653907775878906, -0.03428363800048828, -0.0320281982421875, -0.02977275848388672, -0.027517318725585938, -0.025261878967285156, -0.023006439208984375, -0.020750999450683594, -0.018495559692382812, -0.01624011993408203, -0.01398468017578125, -0.011729240417480469, -0.009473800659179688, -0.007218360900878906, -0.004962921142578125, -0.0027074813842773438, -0.0004520416259765625, 0.0018033981323242188, 0.004058837890625, 0.006314277648925781, 0.008569717407226562, 0.010825157165527344, 0.013080596923828125, 0.015336036682128906, 0.017591476440429688, 0.01984691619873047, 0.02210235595703125, 0.02435779571533203, 0.026613235473632812, 0.028868675231933594, 0.031124114990234375, 0.033379554748535156, 0.03563499450683594, 0.03789043426513672, 0.0401458740234375, 0.04240131378173828, 0.04465675354003906, 0.046912193298339844, 0.049167633056640625, 0.051423072814941406, 0.05367851257324219, 0.05593395233154297, 0.05818939208984375, 0.06044483184814453, 0.06270027160644531, 0.0649557113647461, 0.06721115112304688, 0.06946659088134766, 0.07172203063964844, 0.07397747039794922, 0.07623291015625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 2.0, 5.0, 8.0, 8.0, 13.0, 27.0, 35.0, 50.0, 71.0, 99.0, 117.0, 134.0, 120.0, 86.0, 89.0, 50.0, 38.0, 17.0, 10.0, 8.0, 9.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5131348371505737, -1.4719043970108032, -1.4306739568710327, -1.3894436359405518, -1.3482131958007812, -1.3069827556610107, -1.2657523155212402, -1.2245218753814697, -1.1832914352416992, -1.1420609951019287, -1.1008305549621582, -1.0596002340316772, -1.0183697938919067, -0.9771393537521362, -0.9359089136123657, -0.8946784734725952, -0.8534481525421143, -0.8122177124023438, -0.770987331867218, -0.7297568917274475, -0.6885265111923218, -0.6472960710525513, -0.6060656309127808, -0.5648351907730103, -0.5236048102378845, -0.4823743999004364, -0.4411439895629883, -0.3999135494232178, -0.35868313908576965, -0.31745272874832153, -0.276222288608551, -0.2349918782711029, -0.19376158714294434, -0.15253117680549622, -0.1113007515668869, -0.07007033377885818, -0.028839915990829468, 0.012390494346618652, 0.053620919585227966, 0.09485134482383728, 0.1360817551612854, 0.17731216549873352, 0.21854259073734283, 0.25977301597595215, 0.30100342631340027, 0.3422338366508484, 0.3834642767906189, 0.424694687128067, 0.46592509746551514, 0.5071555376052856, 0.5483859181404114, 0.5896163582801819, 0.6308467388153076, 0.6720771789550781, 0.7133076190948486, 0.7545380592346191, 0.7957684397697449, 0.8369988799095154, 0.8782292604446411, 0.9194597005844116, 0.9606901407241821, 1.001920461654663, 1.0431509017944336, 1.084381341934204, 1.1256117820739746]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 4.0, 7.0, 5.0, 10.0, 14.0, 12.0, 16.0, 26.0, 22.0, 34.0, 32.0, 40.0, 39.0, 52.0, 40.0, 45.0, 60.0, 53.0, 52.0, 57.0, 71.0, 55.0, 43.0, 35.0, 38.0, 32.0, 20.0, 27.0, 15.0, 10.0, 14.0, 13.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-1.4112226963043213, -1.3726794719696045, -1.3341362476348877, -1.295593023300171, -1.257049798965454, -1.2185065746307373, -1.1799633502960205, -1.1414200067520142, -1.1028767824172974, -1.0643335580825806, -1.0257903337478638, -0.987247109413147, -0.9487038254737854, -0.9101606011390686, -0.8716173768043518, -0.8330740928649902, -0.7945309281349182, -0.7559877038002014, -0.7174444794654846, -0.678901195526123, -0.6403579711914062, -0.6018147468566895, -0.5632715225219727, -0.5247282981872559, -0.4861850440502167, -0.4476418197154999, -0.4090985655784607, -0.3705553412437439, -0.3320121169090271, -0.2934688627719879, -0.2549256384372711, -0.21638238430023193, -0.17783915996551514, -0.13929592072963715, -0.10075268894433975, -0.06220945715904236, -0.023666217923164368, 0.014877021312713623, 0.05342024564743042, 0.0919634997844696, 0.1305067241191864, 0.1690499633550644, 0.20759320259094238, 0.24613642692565918, 0.284679651260376, 0.32322290539741516, 0.36176612973213196, 0.40030938386917114, 0.43885260820388794, 0.47739583253860474, 0.5159390568733215, 0.5544823408126831, 0.5930255651473999, 0.6315687894821167, 0.6701120138168335, 0.7086552381515503, 0.7471984624862671, 0.7857416868209839, 0.8242849111557007, 0.8628281354904175, 0.901371419429779, 0.9399146437644958, 0.9784578680992126, 1.0170011520385742, 1.055544376373291]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 4.0, 6.0, 2.0, 7.0, 13.0, 13.0, 16.0, 21.0, 40.0, 64.0, 84.0, 107.0, 186.0, 367.0, 559.0, 1390.0, 4423.0, 24596.0, 4008091.0, 140017.0, 9933.0, 2533.0, 875.0, 390.0, 220.0, 120.0, 77.0, 46.0, 28.0, 13.0, 6.0, 7.0, 5.0, 3.0, 6.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.791015625, -0.7694931030273438, -0.7479705810546875, -0.7264480590820312, -0.704925537109375, -0.6834030151367188, -0.6618804931640625, -0.6403579711914062, -0.61883544921875, -0.5973129272460938, -0.5757904052734375, -0.5542678833007812, -0.532745361328125, -0.5112228393554688, -0.4897003173828125, -0.46817779541015625, -0.4466552734375, -0.42513275146484375, -0.4036102294921875, -0.38208770751953125, -0.360565185546875, -0.33904266357421875, -0.3175201416015625, -0.29599761962890625, -0.27447509765625, -0.25295257568359375, -0.2314300537109375, -0.20990753173828125, -0.188385009765625, -0.16686248779296875, -0.1453399658203125, -0.12381744384765625, -0.102294921875, -0.08077239990234375, -0.0592498779296875, -0.03772735595703125, -0.016204833984375, 0.00531768798828125, 0.0268402099609375, 0.04836273193359375, 0.06988525390625, 0.09140777587890625, 0.1129302978515625, 0.13445281982421875, 0.155975341796875, 0.17749786376953125, 0.1990203857421875, 0.22054290771484375, 0.2420654296875, 0.26358795166015625, 0.2851104736328125, 0.30663299560546875, 0.328155517578125, 0.34967803955078125, 0.3712005615234375, 0.39272308349609375, 0.41424560546875, 0.43576812744140625, 0.4572906494140625, 0.47881317138671875, 0.500335693359375, 0.5218582153320312, 0.5433807373046875, 0.5649032592773438, 0.58642578125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 9.0, 12.0, 15.0, 27.0, 30.0, 44.0, 49.0, 54.0, 81.0, 79.0, 96.0, 96.0, 80.0, 64.0, 60.0, 54.0, 48.0, 29.0, 18.0, 15.0, 15.0, 5.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0999755859375, -0.09753036499023438, -0.09508514404296875, -0.09263992309570312, -0.0901947021484375, -0.08774948120117188, -0.08530426025390625, -0.08285903930664062, -0.080413818359375, -0.07796859741210938, -0.07552337646484375, -0.07307815551757812, -0.0706329345703125, -0.06818771362304688, -0.06574249267578125, -0.06329727172851562, -0.06085205078125, -0.058406829833984375, -0.05596160888671875, -0.053516387939453125, -0.0510711669921875, -0.048625946044921875, -0.04618072509765625, -0.043735504150390625, -0.041290283203125, -0.038845062255859375, -0.03639984130859375, -0.033954620361328125, -0.0315093994140625, -0.029064178466796875, -0.02661895751953125, -0.024173736572265625, -0.021728515625, -0.019283294677734375, -0.01683807373046875, -0.014392852783203125, -0.0119476318359375, -0.009502410888671875, -0.00705718994140625, -0.004611968994140625, -0.002166748046875, 0.000278472900390625, 0.00272369384765625, 0.005168914794921875, 0.0076141357421875, 0.010059356689453125, 0.01250457763671875, 0.014949798583984375, 0.01739501953125, 0.019840240478515625, 0.02228546142578125, 0.024730682373046875, 0.0271759033203125, 0.029621124267578125, 0.03206634521484375, 0.034511566162109375, 0.036956787109375, 0.039402008056640625, 0.04184722900390625, 0.044292449951171875, 0.0467376708984375, 0.049182891845703125, 0.05162811279296875, 0.054073333740234375, 0.0565185546875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 10.0, 20.0, 29.0, 37.0, 79.0, 115.0, 231.0, 520.0, 2398.0, 21854.0, 4095545.0, 67294.0, 4605.0, 848.0, 294.0, 146.0, 110.0, 54.0, 40.0, 26.0, 22.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80810546875, -0.7753372192382812, -0.7425689697265625, -0.7098007202148438, -0.677032470703125, -0.6442642211914062, -0.6114959716796875, -0.5787277221679688, -0.54595947265625, -0.5131912231445312, -0.4804229736328125, -0.44765472412109375, -0.414886474609375, -0.38211822509765625, -0.3493499755859375, -0.31658172607421875, -0.2838134765625, -0.25104522705078125, -0.2182769775390625, -0.18550872802734375, -0.152740478515625, -0.11997222900390625, -0.0872039794921875, -0.05443572998046875, -0.02166748046875, 0.01110076904296875, 0.0438690185546875, 0.07663726806640625, 0.109405517578125, 0.14217376708984375, 0.1749420166015625, 0.20771026611328125, 0.240478515625, 0.27324676513671875, 0.3060150146484375, 0.33878326416015625, 0.371551513671875, 0.40431976318359375, 0.4370880126953125, 0.46985626220703125, 0.50262451171875, 0.5353927612304688, 0.5681610107421875, 0.6009292602539062, 0.633697509765625, 0.6664657592773438, 0.6992340087890625, 0.7320022583007812, 0.7647705078125, 0.7975387573242188, 0.8303070068359375, 0.8630752563476562, 0.895843505859375, 0.9286117553710938, 0.9613800048828125, 0.9941482543945312, 1.02691650390625, 1.0596847534179688, 1.0924530029296875, 1.1252212524414062, 1.157989501953125, 1.1907577514648438, 1.2235260009765625, 1.2562942504882812, 1.2890625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 7.0, 4.0, 6.0, 15.0, 21.0, 38.0, 89.0, 423.0, 2505.0, 661.0, 129.0, 71.0, 28.0, 24.0, 16.0, 19.0, 6.0, 6.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.140380859375, -0.13417434692382812, -0.12796783447265625, -0.12176132202148438, -0.1155548095703125, -0.10934829711914062, -0.10314178466796875, -0.09693527221679688, -0.090728759765625, -0.08452224731445312, -0.07831573486328125, -0.07210922241210938, -0.0659027099609375, -0.059696197509765625, -0.05348968505859375, -0.047283172607421875, -0.04107666015625, -0.034870147705078125, -0.02866363525390625, -0.022457122802734375, -0.0162506103515625, -0.010044097900390625, -0.00383758544921875, 0.002368927001953125, 0.008575439453125, 0.014781951904296875, 0.02098846435546875, 0.027194976806640625, 0.0334014892578125, 0.039608001708984375, 0.04581451416015625, 0.052021026611328125, 0.0582275390625, 0.06443405151367188, 0.07064056396484375, 0.07684707641601562, 0.0830535888671875, 0.08926010131835938, 0.09546661376953125, 0.10167312622070312, 0.107879638671875, 0.11408615112304688, 0.12029266357421875, 0.12649917602539062, 0.1327056884765625, 0.13891220092773438, 0.14511871337890625, 0.15132522583007812, 0.15753173828125, 0.16373825073242188, 0.16994476318359375, 0.17615127563476562, 0.1823577880859375, 0.18856430053710938, 0.19477081298828125, 0.20097732543945312, 0.207183837890625, 0.21339035034179688, 0.21959686279296875, 0.22580337524414062, 0.2320098876953125, 0.23821640014648438, 0.24442291259765625, 0.2506294250488281, 0.2568359375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 34.0, 183.0, 443.0, 243.0, 63.0, 23.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7203451991081238, -0.6518954038619995, -0.58344566822052, -0.5149959325790405, -0.44654613733291626, -0.3780963718891144, -0.3096466064453125, -0.24119684100151062, -0.17274707555770874, -0.10429731011390686, -0.03584754467010498, 0.0326022207736969, 0.10105198621749878, 0.16950175166130066, 0.23795151710510254, 0.3064012825489044, 0.3748510479927063, 0.4433008134365082, 0.5117505788803101, 0.5802003145217896, 0.6486501097679138, 0.7170999050140381, 0.7855496406555176, 0.8539993762969971, 0.9224491715431213, 0.9908989667892456, 1.059348702430725, 1.1277984380722046, 1.1962482929229736, 1.2646980285644531, 1.3331477642059326, 1.401597499847412, 1.4700474739074707, 1.5384972095489502, 1.6069469451904297, 1.6753968000411987, 1.7438465356826782, 1.8122962713241577, 1.8807461261749268, 1.9491958618164062, 2.0176455974578857, 2.0860953330993652, 2.1545450687408447, 2.222994804382324, 2.291444778442383, 2.3598945140838623, 2.428344249725342, 2.4967939853668213, 2.565243721008301, 2.6336934566497803, 2.7021431922912598, 2.7705929279327393, 2.8390426635742188, 2.9074926376342773, 2.975942373275757, 3.0443921089172363, 3.112841844558716, 3.1812915802001953, 3.249741315841675, 3.3181910514831543, 3.386641025543213, 3.4550907611846924, 3.523540496826172, 3.5919902324676514, 3.660439968109131]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 4.0, 13.0, 19.0, 31.0, 23.0, 36.0, 47.0, 46.0, 67.0, 81.0, 70.0, 73.0, 74.0, 71.0, 63.0, 58.0, 61.0, 47.0, 28.0, 27.0, 20.0, 13.0, 11.0, 3.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45294004678726196, -0.4334803521633148, -0.4140206277370453, -0.39456093311309814, -0.3751012086868286, -0.35564151406288147, -0.3361818194389343, -0.3167220950126648, -0.29726240038871765, -0.2778027057647705, -0.258342981338501, -0.23888328671455383, -0.2194235771894455, -0.19996386766433716, -0.18050417304039001, -0.16104446351528168, -0.14158475399017334, -0.122125044465065, -0.10266534239053726, -0.08320564031600952, -0.06374593079090118, -0.04428622126579285, -0.024826519191265106, -0.005366817116737366, 0.014092892408370972, 0.03355259820818901, 0.05301230400800705, 0.07247200608253479, 0.09193171560764313, 0.11139142513275146, 0.1308511197566986, 0.15031082928180695, 0.16977059841156006, 0.1892303079366684, 0.20869001746177673, 0.22814971208572388, 0.24760942161083221, 0.26706913113594055, 0.2865288257598877, 0.3059885501861572, 0.32544824481010437, 0.3449079394340515, 0.36436766386032104, 0.3838273584842682, 0.40328705310821533, 0.42274677753448486, 0.442206472158432, 0.46166616678237915, 0.4811258912086487, 0.5005856156349182, 0.520045280456543, 0.5395050048828125, 0.558964729309082, 0.5784244537353516, 0.5978841185569763, 0.6173438429832458, 0.6368035078048706, 0.6562632322311401, 0.6757228970527649, 0.6951826214790344, 0.714642345905304, 0.7341020107269287, 0.7535617351531982, 0.7730214595794678, 0.7924811840057373]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 8.0, 10.0, 11.0, 17.0, 28.0, 45.0, 59.0, 74.0, 88.0, 169.0, 245.0, 417.0, 844.0, 1601.0, 3841.0, 12177.0, 56080.0, 353257.0, 505616.0, 87448.0, 17283.0, 5003.0, 2006.0, 871.0, 489.0, 310.0, 166.0, 110.0, 81.0, 56.0, 36.0, 36.0, 19.0, 15.0, 13.0, 11.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.314208984375, -0.3034210205078125, -0.292633056640625, -0.2818450927734375, -0.27105712890625, -0.2602691650390625, -0.249481201171875, -0.2386932373046875, -0.2279052734375, -0.2171173095703125, -0.206329345703125, -0.1955413818359375, -0.18475341796875, -0.1739654541015625, -0.163177490234375, -0.1523895263671875, -0.1416015625, -0.1308135986328125, -0.120025634765625, -0.1092376708984375, -0.09844970703125, -0.0876617431640625, -0.076873779296875, -0.0660858154296875, -0.0552978515625, -0.0445098876953125, -0.033721923828125, -0.0229339599609375, -0.01214599609375, -0.0013580322265625, 0.009429931640625, 0.0202178955078125, 0.031005859375, 0.0417938232421875, 0.052581787109375, 0.0633697509765625, 0.07415771484375, 0.0849456787109375, 0.095733642578125, 0.1065216064453125, 0.1173095703125, 0.1280975341796875, 0.138885498046875, 0.1496734619140625, 0.16046142578125, 0.1712493896484375, 0.182037353515625, 0.1928253173828125, 0.20361328125, 0.2144012451171875, 0.225189208984375, 0.2359771728515625, 0.24676513671875, 0.2575531005859375, 0.268341064453125, 0.2791290283203125, 0.2899169921875, 0.3007049560546875, 0.311492919921875, 0.3222808837890625, 0.33306884765625, 0.3438568115234375, 0.354644775390625, 0.3654327392578125, 0.376220703125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 0.0, 4.0, 6.0, 14.0, 14.0, 15.0, 24.0, 26.0, 34.0, 58.0, 64.0, 59.0, 63.0, 94.0, 74.0, 82.0, 58.0, 72.0, 54.0, 38.0, 37.0, 30.0, 28.0, 16.0, 14.0, 3.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0941162109375, -0.09177923202514648, -0.08944225311279297, -0.08710527420043945, -0.08476829528808594, -0.08243131637573242, -0.0800943374633789, -0.07775735855102539, -0.07542037963867188, -0.07308340072631836, -0.07074642181396484, -0.06840944290161133, -0.06607246398925781, -0.0637354850769043, -0.06139850616455078, -0.059061527252197266, -0.05672454833984375, -0.054387569427490234, -0.05205059051513672, -0.0497136116027832, -0.04737663269042969, -0.04503965377807617, -0.042702674865722656, -0.04036569595336914, -0.038028717041015625, -0.03569173812866211, -0.033354759216308594, -0.031017780303955078, -0.028680801391601562, -0.026343822479248047, -0.02400684356689453, -0.021669864654541016, -0.0193328857421875, -0.016995906829833984, -0.014658927917480469, -0.012321949005126953, -0.009984970092773438, -0.007647991180419922, -0.005311012268066406, -0.0029740333557128906, -0.000637054443359375, 0.0016999244689941406, 0.004036903381347656, 0.006373882293701172, 0.008710861206054688, 0.011047840118408203, 0.013384819030761719, 0.015721797943115234, 0.01805877685546875, 0.020395755767822266, 0.02273273468017578, 0.025069713592529297, 0.027406692504882812, 0.029743671417236328, 0.032080650329589844, 0.03441762924194336, 0.036754608154296875, 0.03909158706665039, 0.041428565979003906, 0.04376554489135742, 0.04610252380371094, 0.04843950271606445, 0.05077648162841797, 0.053113460540771484, 0.055450439453125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 8.0, 2.0, 6.0, 10.0, 9.0, 19.0, 21.0, 39.0, 58.0, 135.0, 283.0, 750.0, 2707.0, 12433.0, 83867.0, 600741.0, 303234.0, 35368.0, 6321.0, 1619.0, 485.0, 206.0, 87.0, 51.0, 30.0, 17.0, 16.0, 12.0, 10.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34814453125, -0.3378410339355469, -0.32753753662109375, -0.3172340393066406, -0.3069305419921875, -0.2966270446777344, -0.28632354736328125, -0.2760200500488281, -0.265716552734375, -0.2554130554199219, -0.24510955810546875, -0.23480606079101562, -0.2245025634765625, -0.21419906616210938, -0.20389556884765625, -0.19359207153320312, -0.18328857421875, -0.17298507690429688, -0.16268157958984375, -0.15237808227539062, -0.1420745849609375, -0.13177108764648438, -0.12146759033203125, -0.11116409301757812, -0.100860595703125, -0.09055709838867188, -0.08025360107421875, -0.06995010375976562, -0.0596466064453125, -0.049343109130859375, -0.03903961181640625, -0.028736114501953125, -0.0184326171875, -0.008129119873046875, 0.00217437744140625, 0.012477874755859375, 0.0227813720703125, 0.033084869384765625, 0.04338836669921875, 0.053691864013671875, 0.063995361328125, 0.07429885864257812, 0.08460235595703125, 0.09490585327148438, 0.1052093505859375, 0.11551284790039062, 0.12581634521484375, 0.13611984252929688, 0.14642333984375, 0.15672683715820312, 0.16703033447265625, 0.17733383178710938, 0.1876373291015625, 0.19794082641601562, 0.20824432373046875, 0.21854782104492188, 0.228851318359375, 0.23915481567382812, 0.24945831298828125, 0.2597618103027344, 0.2700653076171875, 0.2803688049316406, 0.29067230224609375, 0.3009757995605469, 0.311279296875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 0.0, 2.0, 5.0, 2.0, 4.0, 6.0, 8.0, 11.0, 14.0, 14.0, 9.0, 17.0, 23.0, 23.0, 41.0, 41.0, 36.0, 40.0, 36.0, 43.0, 52.0, 39.0, 54.0, 48.0, 48.0, 46.0, 47.0, 39.0, 34.0, 43.0, 21.0, 29.0, 18.0, 25.0, 20.0, 9.0, 19.0, 12.0, 9.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2188720703125, -0.21256256103515625, -0.2062530517578125, -0.19994354248046875, -0.193634033203125, -0.18732452392578125, -0.1810150146484375, -0.17470550537109375, -0.16839599609375, -0.16208648681640625, -0.1557769775390625, -0.14946746826171875, -0.143157958984375, -0.13684844970703125, -0.1305389404296875, -0.12422943115234375, -0.117919921875, -0.11161041259765625, -0.1053009033203125, -0.09899139404296875, -0.092681884765625, -0.08637237548828125, -0.0800628662109375, -0.07375335693359375, -0.06744384765625, -0.06113433837890625, -0.0548248291015625, -0.04851531982421875, -0.042205810546875, -0.03589630126953125, -0.0295867919921875, -0.02327728271484375, -0.0169677734375, -0.01065826416015625, -0.0043487548828125, 0.00196075439453125, 0.008270263671875, 0.01457977294921875, 0.0208892822265625, 0.02719879150390625, 0.03350830078125, 0.03981781005859375, 0.0461273193359375, 0.05243682861328125, 0.058746337890625, 0.06505584716796875, 0.0713653564453125, 0.07767486572265625, 0.083984375, 0.09029388427734375, 0.0966033935546875, 0.10291290283203125, 0.109222412109375, 0.11553192138671875, 0.1218414306640625, 0.12815093994140625, 0.13446044921875, 0.14076995849609375, 0.1470794677734375, 0.15338897705078125, 0.159698486328125, 0.16600799560546875, 0.1723175048828125, 0.17862701416015625, 0.1849365234375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 11.0, 12.0, 17.0, 29.0, 36.0, 74.0, 131.0, 235.0, 509.0, 1078.0, 3237.0, 13398.0, 99857.0, 646438.0, 249033.0, 26204.0, 5182.0, 1675.0, 654.0, 332.0, 155.0, 91.0, 56.0, 35.0, 17.0, 18.0, 10.0, 8.0, 4.0, 5.0, 5.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1473388671875, -0.14353084564208984, -0.1397228240966797, -0.13591480255126953, -0.13210678100585938, -0.12829875946044922, -0.12449073791503906, -0.1206827163696289, -0.11687469482421875, -0.1130666732788086, -0.10925865173339844, -0.10545063018798828, -0.10164260864257812, -0.09783458709716797, -0.09402656555175781, -0.09021854400634766, -0.0864105224609375, -0.08260250091552734, -0.07879447937011719, -0.07498645782470703, -0.07117843627929688, -0.06737041473388672, -0.06356239318847656, -0.059754371643066406, -0.05594635009765625, -0.052138328552246094, -0.04833030700683594, -0.04452228546142578, -0.040714263916015625, -0.03690624237060547, -0.03309822082519531, -0.029290199279785156, -0.025482177734375, -0.021674156188964844, -0.017866134643554688, -0.014058113098144531, -0.010250091552734375, -0.006442070007324219, -0.0026340484619140625, 0.0011739730834960938, 0.00498199462890625, 0.008790016174316406, 0.012598037719726562, 0.01640605926513672, 0.020214080810546875, 0.02402210235595703, 0.027830123901367188, 0.031638145446777344, 0.0354461669921875, 0.039254188537597656, 0.04306221008300781, 0.04687023162841797, 0.050678253173828125, 0.05448627471923828, 0.05829429626464844, 0.062102317810058594, 0.06591033935546875, 0.0697183609008789, 0.07352638244628906, 0.07733440399169922, 0.08114242553710938, 0.08495044708251953, 0.08875846862792969, 0.09256649017333984, 0.09637451171875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 11.0, 13.0, 19.0, 26.0, 52.0, 47.0, 113.0, 148.0, 139.0, 111.0, 103.0, 82.0, 49.0, 33.0, 18.0, 12.0, 6.0, 8.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5928020477294922e-05, -2.507586032152176e-05, -2.4223700165748596e-05, -2.3371540009975433e-05, -2.251937985420227e-05, -2.1667219698429108e-05, -2.0815059542655945e-05, -1.9962899386882782e-05, -1.911073923110962e-05, -1.8258579075336456e-05, -1.7406418919563293e-05, -1.655425876379013e-05, -1.5702098608016968e-05, -1.4849938452243805e-05, -1.3997778296470642e-05, -1.314561814069748e-05, -1.2293457984924316e-05, -1.1441297829151154e-05, -1.058913767337799e-05, -9.736977517604828e-06, -8.884817361831665e-06, -8.032657206058502e-06, -7.180497050285339e-06, -6.3283368945121765e-06, -5.476176738739014e-06, -4.624016582965851e-06, -3.771856427192688e-06, -2.919696271419525e-06, -2.0675361156463623e-06, -1.2153759598731995e-06, -3.632158041000366e-07, 4.889443516731262e-07, 1.341104507446289e-06, 2.193264663219452e-06, 3.0454248189926147e-06, 3.897584974765778e-06, 4.7497451305389404e-06, 5.601905286312103e-06, 6.454065442085266e-06, 7.306225597858429e-06, 8.158385753631592e-06, 9.010545909404755e-06, 9.862706065177917e-06, 1.071486622095108e-05, 1.1567026376724243e-05, 1.2419186532497406e-05, 1.3271346688270569e-05, 1.4123506844043732e-05, 1.4975666999816895e-05, 1.5827827155590057e-05, 1.667998731136322e-05, 1.7532147467136383e-05, 1.8384307622909546e-05, 1.923646777868271e-05, 2.008862793445587e-05, 2.0940788090229034e-05, 2.1792948246002197e-05, 2.264510840177536e-05, 2.3497268557548523e-05, 2.4349428713321686e-05, 2.520158886909485e-05, 2.605374902486801e-05, 2.6905909180641174e-05, 2.7758069336414337e-05, 2.86102294921875e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 6.0, 5.0, 13.0, 12.0, 26.0, 29.0, 63.0, 159.0, 264.0, 649.0, 1665.0, 4771.0, 19480.0, 161841.0, 705782.0, 129972.0, 16842.0, 4345.0, 1531.0, 570.0, 257.0, 128.0, 64.0, 27.0, 13.0, 10.0, 9.0, 2.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.162841796875, -0.1582489013671875, -0.153656005859375, -0.1490631103515625, -0.14447021484375, -0.1398773193359375, -0.135284423828125, -0.1306915283203125, -0.1260986328125, -0.1215057373046875, -0.116912841796875, -0.1123199462890625, -0.10772705078125, -0.1031341552734375, -0.098541259765625, -0.0939483642578125, -0.08935546875, -0.0847625732421875, -0.080169677734375, -0.0755767822265625, -0.07098388671875, -0.0663909912109375, -0.061798095703125, -0.0572052001953125, -0.0526123046875, -0.0480194091796875, -0.043426513671875, -0.0388336181640625, -0.03424072265625, -0.0296478271484375, -0.025054931640625, -0.0204620361328125, -0.015869140625, -0.0112762451171875, -0.006683349609375, -0.0020904541015625, 0.00250244140625, 0.0070953369140625, 0.011688232421875, 0.0162811279296875, 0.0208740234375, 0.0254669189453125, 0.030059814453125, 0.0346527099609375, 0.03924560546875, 0.0438385009765625, 0.048431396484375, 0.0530242919921875, 0.0576171875, 0.0622100830078125, 0.066802978515625, 0.0713958740234375, 0.07598876953125, 0.0805816650390625, 0.085174560546875, 0.0897674560546875, 0.0943603515625, 0.0989532470703125, 0.103546142578125, 0.1081390380859375, 0.11273193359375, 0.1173248291015625, 0.121917724609375, 0.1265106201171875, 0.131103515625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 13.0, 7.0, 13.0, 18.0, 13.0, 18.0, 36.0, 51.0, 49.0, 60.0, 58.0, 61.0, 70.0, 54.0, 78.0, 76.0, 62.0, 51.0, 35.0, 38.0, 27.0, 20.0, 17.0, 10.0, 18.0, 4.0, 9.0, 5.0, 3.0, 2.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0706787109375, -0.06836509704589844, -0.06605148315429688, -0.06373786926269531, -0.06142425537109375, -0.05911064147949219, -0.056797027587890625, -0.05448341369628906, -0.0521697998046875, -0.04985618591308594, -0.047542572021484375, -0.04522895812988281, -0.04291534423828125, -0.04060173034667969, -0.038288116455078125, -0.03597450256347656, -0.033660888671875, -0.03134727478027344, -0.029033660888671875, -0.026720046997070312, -0.02440643310546875, -0.022092819213867188, -0.019779205322265625, -0.017465591430664062, -0.0151519775390625, -0.012838363647460938, -0.010524749755859375, -0.008211135864257812, -0.00589752197265625, -0.0035839080810546875, -0.001270294189453125, 0.0010433197021484375, 0.00335693359375, 0.0056705474853515625, 0.007984161376953125, 0.010297775268554688, 0.01261138916015625, 0.014925003051757812, 0.017238616943359375, 0.019552230834960938, 0.0218658447265625, 0.024179458618164062, 0.026493072509765625, 0.028806686401367188, 0.03112030029296875, 0.03343391418457031, 0.035747528076171875, 0.03806114196777344, 0.040374755859375, 0.04268836975097656, 0.045001983642578125, 0.04731559753417969, 0.04962921142578125, 0.05194282531738281, 0.054256439208984375, 0.05657005310058594, 0.0588836669921875, 0.06119728088378906, 0.06351089477539062, 0.06582450866699219, 0.06813812255859375, 0.07045173645019531, 0.07276535034179688, 0.07507896423339844, 0.077392578125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 7.0, 42.0, 115.0, 360.0, 321.0, 112.0, 39.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1859989166259766, -1.067253828048706, -0.9485087394714355, -0.8297635912895203, -0.7110185027122498, -0.5922734141349792, -0.47352826595306396, -0.35478317737579346, -0.23603808879852295, -0.11729298532009125, 0.001452118158340454, 0.12019723653793335, 0.23894232511520386, 0.35768741369247437, 0.47643256187438965, 0.5951776504516602, 0.7139227390289307, 0.8326678276062012, 0.9514129161834717, 1.0701580047607422, 1.1889030933380127, 1.3076481819152832, 1.4263933897018433, 1.5451384782791138, 1.6638835668563843, 1.7826286554336548, 1.9013737440109253, 2.0201189517974854, 2.138864040374756, 2.2576091289520264, 2.376354217529297, 2.4950993061065674, 2.613844394683838, 2.7325894832611084, 2.851334571838379, 2.9700796604156494, 3.08882474899292, 3.2075698375701904, 3.326314926147461, 3.4450602531433105, 3.563805103302002, 3.6825501918792725, 3.801295280456543, 3.9200403690338135, 4.038785457611084, 4.157530784606934, 4.276275634765625, 4.395020961761475, 4.513766288757324, 4.632511615753174, 4.751256465911865, 4.870001792907715, 4.988746643066406, 5.107491970062256, 5.226236820220947, 5.344982147216797, 5.463726997375488, 5.582472324371338, 5.701217174530029, 5.819962501525879, 5.93870735168457, 6.05745267868042, 6.176197528839111, 6.294942855834961, 6.413687705993652]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 6.0, 6.0, 5.0, 5.0, 11.0, 6.0, 13.0, 5.0, 17.0, 17.0, 20.0, 18.0, 20.0, 20.0, 29.0, 35.0, 36.0, 30.0, 43.0, 62.0, 47.0, 48.0, 35.0, 42.0, 33.0, 36.0, 59.0, 35.0, 29.0, 29.0, 32.0, 32.0, 19.0, 18.0, 17.0, 9.0, 20.0, 12.0, 11.0, 9.0, 9.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.008568525314331, -0.9773091077804565, -0.946049690246582, -0.9147902727127075, -0.8835309147834778, -0.8522714972496033, -0.8210120797157288, -0.7897526621818542, -0.7584933042526245, -0.72723388671875, -0.6959744691848755, -0.664715051651001, -0.6334556937217712, -0.6021962761878967, -0.5709368586540222, -0.5396774411201477, -0.5084180235862732, -0.4771586060523987, -0.44589921832084656, -0.41463980078697205, -0.3833804130554199, -0.3521209955215454, -0.3208615779876709, -0.2896021604537964, -0.25834277272224426, -0.22708337008953094, -0.19582396745681763, -0.16456454992294312, -0.1333051472902298, -0.10204574465751648, -0.07078632712364197, -0.03952692449092865, -0.008267462253570557, 0.02299194410443306, 0.054251350462436676, 0.08551076054573059, 0.11677016317844391, 0.14802956581115723, 0.17928898334503174, 0.21054838597774506, 0.24180778861045837, 0.2730672061443329, 0.304326593875885, 0.3355860114097595, 0.36684542894363403, 0.39810481667518616, 0.42936423420906067, 0.4606236219406128, 0.4918830394744873, 0.5231424570083618, 0.5544018745422363, 0.5856612920761108, 0.6169206500053406, 0.6481800675392151, 0.6794394850730896, 0.7106989026069641, 0.7419582605361938, 0.7732176780700684, 0.8044770956039429, 0.8357365131378174, 0.8669958710670471, 0.8982552886009216, 0.9295147061347961, 0.9607741236686707, 0.9920335412025452]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 10.0, 7.0, 15.0, 14.0, 11.0, 21.0, 37.0, 43.0, 64.0, 81.0, 161.0, 268.0, 515.0, 1078.0, 2728.0, 9965.0, 127609.0, 3999073.0, 42232.0, 6472.0, 2051.0, 859.0, 386.0, 237.0, 124.0, 76.0, 45.0, 21.0, 25.0, 9.0, 10.0, 6.0, 5.0, 5.0, 1.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.60009765625, -0.5835838317871094, -0.5670700073242188, -0.5505561828613281, -0.5340423583984375, -0.5175285339355469, -0.5010147094726562, -0.4845008850097656, -0.467987060546875, -0.4514732360839844, -0.43495941162109375, -0.4184455871582031, -0.4019317626953125, -0.3854179382324219, -0.36890411376953125, -0.3523902893066406, -0.33587646484375, -0.3193626403808594, -0.30284881591796875, -0.2863349914550781, -0.2698211669921875, -0.2533073425292969, -0.23679351806640625, -0.22027969360351562, -0.203765869140625, -0.18725204467773438, -0.17073822021484375, -0.15422439575195312, -0.1377105712890625, -0.12119674682617188, -0.10468292236328125, -0.08816909790039062, -0.0716552734375, -0.055141448974609375, -0.03862762451171875, -0.022113800048828125, -0.0055999755859375, 0.010913848876953125, 0.02742767333984375, 0.043941497802734375, 0.060455322265625, 0.07696914672851562, 0.09348297119140625, 0.10999679565429688, 0.1265106201171875, 0.14302444458007812, 0.15953826904296875, 0.17605209350585938, 0.19256591796875, 0.20907974243164062, 0.22559356689453125, 0.24210739135742188, 0.2586212158203125, 0.2751350402832031, 0.29164886474609375, 0.3081626892089844, 0.324676513671875, 0.3411903381347656, 0.35770416259765625, 0.3742179870605469, 0.3907318115234375, 0.4072456359863281, 0.42375946044921875, 0.4402732849121094, 0.456787109375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 7.0, 9.0, 21.0, 22.0, 25.0, 27.0, 42.0, 47.0, 52.0, 56.0, 65.0, 92.0, 80.0, 64.0, 90.0, 65.0, 57.0, 45.0, 25.0, 24.0, 24.0, 21.0, 7.0, 11.0, 5.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08526611328125, -0.08284282684326172, -0.08041954040527344, -0.07799625396728516, -0.07557296752929688, -0.0731496810913086, -0.07072639465332031, -0.06830310821533203, -0.06587982177734375, -0.06345653533935547, -0.06103324890136719, -0.058609962463378906, -0.056186676025390625, -0.053763389587402344, -0.05134010314941406, -0.04891681671142578, -0.0464935302734375, -0.04407024383544922, -0.04164695739746094, -0.039223670959472656, -0.036800384521484375, -0.034377098083496094, -0.03195381164550781, -0.02953052520751953, -0.02710723876953125, -0.02468395233154297, -0.022260665893554688, -0.019837379455566406, -0.017414093017578125, -0.014990806579589844, -0.012567520141601562, -0.010144233703613281, -0.007720947265625, -0.005297660827636719, -0.0028743743896484375, -0.00045108795166015625, 0.001972198486328125, 0.004395484924316406, 0.0068187713623046875, 0.009242057800292969, 0.01166534423828125, 0.014088630676269531, 0.016511917114257812, 0.018935203552246094, 0.021358489990234375, 0.023781776428222656, 0.026205062866210938, 0.02862834930419922, 0.0310516357421875, 0.03347492218017578, 0.03589820861816406, 0.038321495056152344, 0.040744781494140625, 0.043168067932128906, 0.04559135437011719, 0.04801464080810547, 0.05043792724609375, 0.05286121368408203, 0.05528450012207031, 0.057707786560058594, 0.060131072998046875, 0.06255435943603516, 0.06497764587402344, 0.06740093231201172, 0.06982421875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 5.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 8.0, 13.0, 26.0, 69.0, 125.0, 274.0, 762.0, 2154.0, 7104.0, 41917.0, 3967754.0, 155957.0, 12838.0, 3439.0, 1102.0, 389.0, 164.0, 70.0, 29.0, 28.0, 14.0, 6.0, 5.0, 7.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.470458984375, -0.4521522521972656, -0.43384552001953125, -0.4155387878417969, -0.3972320556640625, -0.3789253234863281, -0.36061859130859375, -0.3423118591308594, -0.324005126953125, -0.3056983947753906, -0.28739166259765625, -0.2690849304199219, -0.2507781982421875, -0.23247146606445312, -0.21416473388671875, -0.19585800170898438, -0.17755126953125, -0.15924453735351562, -0.14093780517578125, -0.12263107299804688, -0.1043243408203125, -0.08601760864257812, -0.06771087646484375, -0.049404144287109375, -0.031097412109375, -0.012790679931640625, 0.00551605224609375, 0.023822784423828125, 0.0421295166015625, 0.060436248779296875, 0.07874298095703125, 0.09704971313476562, 0.1153564453125, 0.13366317749023438, 0.15196990966796875, 0.17027664184570312, 0.1885833740234375, 0.20689010620117188, 0.22519683837890625, 0.24350357055664062, 0.261810302734375, 0.2801170349121094, 0.29842376708984375, 0.3167304992675781, 0.3350372314453125, 0.3533439636230469, 0.37165069580078125, 0.3899574279785156, 0.40826416015625, 0.4265708923339844, 0.44487762451171875, 0.4631843566894531, 0.4814910888671875, 0.4997978210449219, 0.5181045532226562, 0.5364112854003906, 0.554718017578125, 0.5730247497558594, 0.5913314819335938, 0.6096382141113281, 0.6279449462890625, 0.6462516784667969, 0.6645584106445312, 0.6828651428222656, 0.701171875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 8.0, 7.0, 12.0, 14.0, 26.0, 31.0, 46.0, 95.0, 301.0, 1295.0, 1500.0, 415.0, 124.0, 59.0, 40.0, 27.0, 10.0, 12.0, 11.0, 3.0, 2.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.118408203125, -0.11386489868164062, -0.10932159423828125, -0.10477828979492188, -0.1002349853515625, -0.09569168090820312, -0.09114837646484375, -0.08660507202148438, -0.082061767578125, -0.07751846313476562, -0.07297515869140625, -0.06843185424804688, -0.0638885498046875, -0.059345245361328125, -0.05480194091796875, -0.050258636474609375, -0.04571533203125, -0.041172027587890625, -0.03662872314453125, -0.032085418701171875, -0.0275421142578125, -0.022998809814453125, -0.01845550537109375, -0.013912200927734375, -0.009368896484375, -0.004825592041015625, -0.00028228759765625, 0.004261016845703125, 0.0088043212890625, 0.013347625732421875, 0.01789093017578125, 0.022434234619140625, 0.0269775390625, 0.031520843505859375, 0.03606414794921875, 0.040607452392578125, 0.0451507568359375, 0.049694061279296875, 0.05423736572265625, 0.058780670166015625, 0.063323974609375, 0.06786727905273438, 0.07241058349609375, 0.07695388793945312, 0.0814971923828125, 0.08604049682617188, 0.09058380126953125, 0.09512710571289062, 0.09967041015625, 0.10421371459960938, 0.10875701904296875, 0.11330032348632812, 0.1178436279296875, 0.12238693237304688, 0.12693023681640625, 0.13147354125976562, 0.136016845703125, 0.14056015014648438, 0.14510345458984375, 0.14964675903320312, 0.1541900634765625, 0.15873336791992188, 0.16327667236328125, 0.16781997680664062, 0.17236328125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 10.0, 33.0, 384.0, 504.0, 63.0, 15.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9903552532196045, -3.8765792846679688, -3.762803316116333, -3.6490275859832764, -3.5352516174316406, -3.421475648880005, -3.307699680328369, -3.1939239501953125, -3.0801479816436768, -2.966372013092041, -2.8525960445404053, -2.7388203144073486, -2.625044345855713, -2.511268377304077, -2.3974924087524414, -2.2837166786193848, -2.16994047164917, -2.056164503097534, -1.942388653755188, -1.8286126852035522, -1.714836835861206, -1.6010608673095703, -1.4872848987579346, -1.3735090494155884, -1.2597332000732422, -1.1459572315216064, -1.0321813821792603, -0.9184054136276245, -0.8046295642852783, -0.6908535957336426, -0.5770776867866516, -0.46330177783966064, -0.34952592849731445, -0.2357500195503235, -0.12197409570217133, -0.008198171854019165, 0.1055777370929718, 0.21935367584228516, 0.3331295847892761, 0.4469054937362671, 0.5606814026832581, 0.674457311630249, 0.78823322057724, 0.902009129524231, 1.0157850980758667, 1.129560947418213, 1.2433369159698486, 1.3571128845214844, 1.4708887338638306, 1.5846647024154663, 1.6984405517578125, 1.8122165203094482, 1.9259923696517944, 2.0397682189941406, 2.1535441875457764, 2.267320156097412, 2.381096124649048, 2.4948720932006836, 2.6086480617523193, 2.722423791885376, 2.8361997604370117, 2.9499757289886475, 3.063751697540283, 3.17752742767334, 3.2913033962249756]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 3.0, 7.0, 9.0, 13.0, 20.0, 15.0, 28.0, 25.0, 32.0, 38.0, 35.0, 36.0, 59.0, 51.0, 62.0, 74.0, 57.0, 63.0, 49.0, 49.0, 50.0, 45.0, 33.0, 35.0, 33.0, 18.0, 15.0, 10.0, 14.0, 8.0, 5.0, 6.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3858994245529175, -0.37095364928245544, -0.356007844209671, -0.341062068939209, -0.32611626386642456, -0.3111704885959625, -0.2962246835231781, -0.28127890825271606, -0.26633310317993164, -0.2513873279094696, -0.23644152283668518, -0.22149573266506195, -0.20654994249343872, -0.19160416722297668, -0.17665836215019226, -0.16171258687973022, -0.146766796708107, -0.13182100653648376, -0.11687521636486053, -0.1019294261932373, -0.08698363602161407, -0.07203785330057144, -0.05709206312894821, -0.04214627295732498, -0.02720048278570175, -0.012254693545401096, 0.002691095694899559, 0.01763688400387764, 0.03258267417550087, 0.0475284606218338, 0.06247425079345703, 0.07742004096508026, 0.09236583113670349, 0.10731162130832672, 0.12225741147994995, 0.13720320165157318, 0.1521489918231964, 0.16709476709365845, 0.18204057216644287, 0.1969863474369049, 0.21193215250968933, 0.22687794268131256, 0.2418237328529358, 0.2567695081233978, 0.27171531319618225, 0.2866610884666443, 0.3016068935394287, 0.31655266880989075, 0.3314984440803528, 0.3464442193508148, 0.36139002442359924, 0.3763357996940613, 0.3912816047668457, 0.40622738003730774, 0.42117318511009216, 0.4361189603805542, 0.4510647654533386, 0.46601054072380066, 0.4809563457965851, 0.4959021210670471, 0.5108479261398315, 0.525793731212616, 0.5407394766807556, 0.55568528175354, 0.5706310868263245]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 5.0, 5.0, 15.0, 10.0, 19.0, 35.0, 43.0, 59.0, 107.0, 143.0, 272.0, 501.0, 1103.0, 2512.0, 7522.0, 35091.0, 266983.0, 615599.0, 95077.0, 15947.0, 4253.0, 1598.0, 753.0, 382.0, 190.0, 115.0, 64.0, 53.0, 23.0, 30.0, 7.0, 12.0, 6.0, 8.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3798828125, -0.3673286437988281, -0.35477447509765625, -0.3422203063964844, -0.3296661376953125, -0.3171119689941406, -0.30455780029296875, -0.2920036315917969, -0.279449462890625, -0.2668952941894531, -0.25434112548828125, -0.24178695678710938, -0.2292327880859375, -0.21667861938476562, -0.20412445068359375, -0.19157028198242188, -0.17901611328125, -0.16646194458007812, -0.15390777587890625, -0.14135360717773438, -0.1287994384765625, -0.11624526977539062, -0.10369110107421875, -0.09113693237304688, -0.078582763671875, -0.06602859497070312, -0.05347442626953125, -0.040920257568359375, -0.0283660888671875, -0.015811920166015625, -0.00325775146484375, 0.009296417236328125, 0.0218505859375, 0.034404754638671875, 0.04695892333984375, 0.059513092041015625, 0.0720672607421875, 0.08462142944335938, 0.09717559814453125, 0.10972976684570312, 0.122283935546875, 0.13483810424804688, 0.14739227294921875, 0.15994644165039062, 0.1725006103515625, 0.18505477905273438, 0.19760894775390625, 0.21016311645507812, 0.22271728515625, 0.23527145385742188, 0.24782562255859375, 0.2603797912597656, 0.2729339599609375, 0.2854881286621094, 0.29804229736328125, 0.3105964660644531, 0.323150634765625, 0.3357048034667969, 0.34825897216796875, 0.3608131408691406, 0.3733673095703125, 0.3859214782714844, 0.39847564697265625, 0.4110298156738281, 0.423583984375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 7.0, 4.0, 10.0, 15.0, 22.0, 24.0, 33.0, 37.0, 37.0, 47.0, 49.0, 71.0, 82.0, 77.0, 72.0, 77.0, 70.0, 63.0, 44.0, 44.0, 30.0, 27.0, 27.0, 14.0, 11.0, 5.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.09088134765625, -0.08833789825439453, -0.08579444885253906, -0.0832509994506836, -0.08070755004882812, -0.07816410064697266, -0.07562065124511719, -0.07307720184326172, -0.07053375244140625, -0.06799030303955078, -0.06544685363769531, -0.06290340423583984, -0.060359954833984375, -0.057816505432128906, -0.05527305603027344, -0.05272960662841797, -0.0501861572265625, -0.04764270782470703, -0.04509925842285156, -0.042555809020996094, -0.040012359619140625, -0.037468910217285156, -0.03492546081542969, -0.03238201141357422, -0.02983856201171875, -0.02729511260986328, -0.024751663208007812, -0.022208213806152344, -0.019664764404296875, -0.017121315002441406, -0.014577865600585938, -0.012034416198730469, -0.009490966796875, -0.006947517395019531, -0.0044040679931640625, -0.0018606185913085938, 0.000682830810546875, 0.0032262802124023438, 0.0057697296142578125, 0.008313179016113281, 0.01085662841796875, 0.013400077819824219, 0.015943527221679688, 0.018486976623535156, 0.021030426025390625, 0.023573875427246094, 0.026117324829101562, 0.02866077423095703, 0.0312042236328125, 0.03374767303466797, 0.03629112243652344, 0.038834571838378906, 0.041378021240234375, 0.043921470642089844, 0.04646492004394531, 0.04900836944580078, 0.05155181884765625, 0.05409526824951172, 0.05663871765136719, 0.059182167053222656, 0.061725616455078125, 0.0642690658569336, 0.06681251525878906, 0.06935596466064453, 0.0718994140625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 6.0, 6.0, 1.0, 8.0, 4.0, 7.0, 14.0, 12.0, 18.0, 39.0, 49.0, 100.0, 207.0, 426.0, 1175.0, 3761.0, 15300.0, 94914.0, 579257.0, 300934.0, 40618.0, 8096.0, 2222.0, 701.0, 308.0, 152.0, 79.0, 40.0, 30.0, 17.0, 6.0, 10.0, 13.0, 7.0, 2.0, 3.0, 4.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.282958984375, -0.27405548095703125, -0.2651519775390625, -0.25624847412109375, -0.247344970703125, -0.23844146728515625, -0.2295379638671875, -0.22063446044921875, -0.21173095703125, -0.20282745361328125, -0.1939239501953125, -0.18502044677734375, -0.176116943359375, -0.16721343994140625, -0.1583099365234375, -0.14940643310546875, -0.1405029296875, -0.13159942626953125, -0.1226959228515625, -0.11379241943359375, -0.104888916015625, -0.09598541259765625, -0.0870819091796875, -0.07817840576171875, -0.06927490234375, -0.06037139892578125, -0.0514678955078125, -0.04256439208984375, -0.033660888671875, -0.02475738525390625, -0.0158538818359375, -0.00695037841796875, 0.001953125, 0.01085662841796875, 0.0197601318359375, 0.02866363525390625, 0.037567138671875, 0.04647064208984375, 0.0553741455078125, 0.06427764892578125, 0.07318115234375, 0.08208465576171875, 0.0909881591796875, 0.09989166259765625, 0.108795166015625, 0.11769866943359375, 0.1266021728515625, 0.13550567626953125, 0.1444091796875, 0.15331268310546875, 0.1622161865234375, 0.17111968994140625, 0.180023193359375, 0.18892669677734375, 0.1978302001953125, 0.20673370361328125, 0.21563720703125, 0.22454071044921875, 0.2334442138671875, 0.24234771728515625, 0.251251220703125, 0.26015472412109375, 0.2690582275390625, 0.27796173095703125, 0.286865234375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 4.0, 8.0, 9.0, 19.0, 10.0, 12.0, 10.0, 16.0, 29.0, 27.0, 30.0, 26.0, 27.0, 39.0, 39.0, 37.0, 40.0, 41.0, 52.0, 56.0, 54.0, 39.0, 34.0, 46.0, 33.0, 36.0, 40.0, 20.0, 22.0, 31.0, 23.0, 15.0, 7.0, 17.0, 13.0, 5.0, 7.0, 4.0, 7.0, 5.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-0.18603515625, -0.17991256713867188, -0.17378997802734375, -0.16766738891601562, -0.1615447998046875, -0.15542221069335938, -0.14929962158203125, -0.14317703247070312, -0.137054443359375, -0.13093185424804688, -0.12480926513671875, -0.11868667602539062, -0.1125640869140625, -0.10644149780273438, -0.10031890869140625, -0.09419631958007812, -0.08807373046875, -0.08195114135742188, -0.07582855224609375, -0.06970596313476562, -0.0635833740234375, -0.057460784912109375, -0.05133819580078125, -0.045215606689453125, -0.039093017578125, -0.032970428466796875, -0.02684783935546875, -0.020725250244140625, -0.0146026611328125, -0.008480072021484375, -0.00235748291015625, 0.003765106201171875, 0.0098876953125, 0.016010284423828125, 0.02213287353515625, 0.028255462646484375, 0.0343780517578125, 0.040500640869140625, 0.04662322998046875, 0.052745819091796875, 0.058868408203125, 0.06499099731445312, 0.07111358642578125, 0.07723617553710938, 0.0833587646484375, 0.08948135375976562, 0.09560394287109375, 0.10172653198242188, 0.10784912109375, 0.11397171020507812, 0.12009429931640625, 0.12621688842773438, 0.1323394775390625, 0.13846206665039062, 0.14458465576171875, 0.15070724487304688, 0.156829833984375, 0.16295242309570312, 0.16907501220703125, 0.17519760131835938, 0.1813201904296875, 0.18744277954101562, 0.19356536865234375, 0.19968795776367188, 0.205810546875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 10.0, 9.0, 14.0, 20.0, 55.0, 95.0, 219.0, 484.0, 1473.0, 11484.0, 679693.0, 345891.0, 7124.0, 1175.0, 410.0, 186.0, 109.0, 51.0, 24.0, 15.0, 7.0, 6.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.290283203125, -0.281463623046875, -0.27264404296875, -0.263824462890625, -0.2550048828125, -0.246185302734375, -0.23736572265625, -0.228546142578125, -0.2197265625, -0.210906982421875, -0.20208740234375, -0.193267822265625, -0.1844482421875, -0.175628662109375, -0.16680908203125, -0.157989501953125, -0.149169921875, -0.140350341796875, -0.13153076171875, -0.122711181640625, -0.1138916015625, -0.105072021484375, -0.09625244140625, -0.087432861328125, -0.07861328125, -0.069793701171875, -0.06097412109375, -0.052154541015625, -0.0433349609375, -0.034515380859375, -0.02569580078125, -0.016876220703125, -0.008056640625, 0.000762939453125, 0.00958251953125, 0.018402099609375, 0.0272216796875, 0.036041259765625, 0.04486083984375, 0.053680419921875, 0.0625, 0.071319580078125, 0.08013916015625, 0.088958740234375, 0.0977783203125, 0.106597900390625, 0.11541748046875, 0.124237060546875, 0.133056640625, 0.141876220703125, 0.15069580078125, 0.159515380859375, 0.1683349609375, 0.177154541015625, 0.18597412109375, 0.194793701171875, 0.20361328125, 0.212432861328125, 0.22125244140625, 0.230072021484375, 0.2388916015625, 0.247711181640625, 0.25653076171875, 0.265350341796875, 0.274169921875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 6.0, 3.0, 6.0, 10.0, 7.0, 8.0, 14.0, 21.0, 24.0, 39.0, 62.0, 93.0, 95.0, 139.0, 122.0, 118.0, 70.0, 56.0, 32.0, 27.0, 16.0, 11.0, 8.0, 5.0, 6.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.996755599975586e-05, -1.9162893295288086e-05, -1.8358230590820312e-05, -1.755356788635254e-05, -1.6748905181884766e-05, -1.5944242477416992e-05, -1.5139579772949219e-05, -1.4334917068481445e-05, -1.3530254364013672e-05, -1.2725591659545898e-05, -1.1920928955078125e-05, -1.1116266250610352e-05, -1.0311603546142578e-05, -9.506940841674805e-06, -8.702278137207031e-06, -7.897615432739258e-06, -7.092952728271484e-06, -6.288290023803711e-06, -5.4836273193359375e-06, -4.678964614868164e-06, -3.874301910400391e-06, -3.069639205932617e-06, -2.2649765014648438e-06, -1.4603137969970703e-06, -6.556510925292969e-07, 1.4901161193847656e-07, 9.5367431640625e-07, 1.7583370208740234e-06, 2.562999725341797e-06, 3.3676624298095703e-06, 4.172325134277344e-06, 4.976987838745117e-06, 5.781650543212891e-06, 6.586313247680664e-06, 7.3909759521484375e-06, 8.195638656616211e-06, 9.000301361083984e-06, 9.804964065551758e-06, 1.0609626770019531e-05, 1.1414289474487305e-05, 1.2218952178955078e-05, 1.3023614883422852e-05, 1.3828277587890625e-05, 1.4632940292358398e-05, 1.5437602996826172e-05, 1.6242265701293945e-05, 1.704692840576172e-05, 1.7851591110229492e-05, 1.8656253814697266e-05, 1.946091651916504e-05, 2.0265579223632812e-05, 2.1070241928100586e-05, 2.187490463256836e-05, 2.2679567337036133e-05, 2.3484230041503906e-05, 2.428889274597168e-05, 2.5093555450439453e-05, 2.5898218154907227e-05, 2.6702880859375e-05, 2.7507543563842773e-05, 2.8312206268310547e-05, 2.911686897277832e-05, 2.9921531677246094e-05, 3.072619438171387e-05, 3.153085708618164e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 8.0, 17.0, 15.0, 20.0, 46.0, 77.0, 152.0, 243.0, 505.0, 1687.0, 17920.0, 769254.0, 249616.0, 7060.0, 1061.0, 385.0, 204.0, 125.0, 83.0, 36.0, 26.0, 14.0, 4.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.37744140625, -0.3688316345214844, -0.36022186279296875, -0.3516120910644531, -0.3430023193359375, -0.3343925476074219, -0.32578277587890625, -0.3171730041503906, -0.308563232421875, -0.2999534606933594, -0.29134368896484375, -0.2827339172363281, -0.2741241455078125, -0.2655143737792969, -0.25690460205078125, -0.24829483032226562, -0.23968505859375, -0.23107528686523438, -0.22246551513671875, -0.21385574340820312, -0.2052459716796875, -0.19663619995117188, -0.18802642822265625, -0.17941665649414062, -0.170806884765625, -0.16219711303710938, -0.15358734130859375, -0.14497756958007812, -0.1363677978515625, -0.12775802612304688, -0.11914825439453125, -0.11053848266601562, -0.1019287109375, -0.09331893920898438, -0.08470916748046875, -0.07609939575195312, -0.0674896240234375, -0.058879852294921875, -0.05027008056640625, -0.041660308837890625, -0.033050537109375, -0.024440765380859375, -0.01583099365234375, -0.007221221923828125, 0.0013885498046875, 0.009998321533203125, 0.01860809326171875, 0.027217864990234375, 0.03582763671875, 0.044437408447265625, 0.05304718017578125, 0.061656951904296875, 0.0702667236328125, 0.07887649536132812, 0.08748626708984375, 0.09609603881835938, 0.104705810546875, 0.11331558227539062, 0.12192535400390625, 0.13053512573242188, 0.1391448974609375, 0.14775466918945312, 0.15636444091796875, 0.16497421264648438, 0.173583984375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 9.0, 12.0, 15.0, 23.0, 68.0, 135.0, 191.0, 213.0, 175.0, 76.0, 49.0, 24.0, 11.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2154541015625, -0.20830726623535156, -0.20116043090820312, -0.1940135955810547, -0.18686676025390625, -0.1797199249267578, -0.17257308959960938, -0.16542625427246094, -0.1582794189453125, -0.15113258361816406, -0.14398574829101562, -0.1368389129638672, -0.12969207763671875, -0.12254524230957031, -0.11539840698242188, -0.10825157165527344, -0.101104736328125, -0.09395790100097656, -0.08681106567382812, -0.07966423034667969, -0.07251739501953125, -0.06537055969238281, -0.058223724365234375, -0.05107688903808594, -0.0439300537109375, -0.03678321838378906, -0.029636383056640625, -0.022489547729492188, -0.01534271240234375, -0.008195877075195312, -0.001049041748046875, 0.0060977935791015625, 0.01324462890625, 0.020391464233398438, 0.027538299560546875, 0.03468513488769531, 0.04183197021484375, 0.04897880554199219, 0.056125640869140625, 0.06327247619628906, 0.0704193115234375, 0.07756614685058594, 0.08471298217773438, 0.09185981750488281, 0.09900665283203125, 0.10615348815917969, 0.11330032348632812, 0.12044715881347656, 0.127593994140625, 0.13474082946777344, 0.14188766479492188, 0.1490345001220703, 0.15618133544921875, 0.1633281707763672, 0.17047500610351562, 0.17762184143066406, 0.1847686767578125, 0.19191551208496094, 0.19906234741210938, 0.2062091827392578, 0.21335601806640625, 0.2205028533935547, 0.22764968872070312, 0.23479652404785156, 0.241943359375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 10.0, 27.0, 47.0, 88.0, 133.0, 171.0, 200.0, 151.0, 98.0, 40.0, 23.0, 8.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2097201347351074, -1.1464424133300781, -1.0831648111343384, -1.0198872089385986, -0.9566094875335693, -0.8933318257331848, -0.8300541639328003, -0.7667765021324158, -0.7034988403320312, -0.6402211785316467, -0.5769435167312622, -0.5136658549308777, -0.45038819313049316, -0.38711053133010864, -0.3238328695297241, -0.2605552077293396, -0.19727754592895508, -0.13399988412857056, -0.07072222232818604, -0.007444560527801514, 0.05583310127258301, 0.11911076307296753, 0.18238842487335205, 0.24566608667373657, 0.3089437484741211, 0.3722214102745056, 0.43549907207489014, 0.49877673387527466, 0.5620543956756592, 0.6253320574760437, 0.6886097192764282, 0.7518873810768127, 0.8151650428771973, 0.8784427046775818, 0.9417203664779663, 1.004997968673706, 1.0682756900787354, 1.1315534114837646, 1.1948310136795044, 1.2581086158752441, 1.3213863372802734, 1.3846640586853027, 1.4479416608810425, 1.5112192630767822, 1.5744969844818115, 1.6377747058868408, 1.7010523080825806, 1.7643299102783203, 1.8276076316833496, 1.890885353088379, 1.9541629552841187, 2.0174405574798584, 2.0807182788848877, 2.143996000289917, 2.207273483276367, 2.2705512046813965, 2.333828926086426, 2.397106647491455, 2.4603843688964844, 2.5236618518829346, 2.586939573287964, 2.650217294692993, 2.7134947776794434, 2.7767724990844727, 2.840050220489502]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 6.0, 2.0, 5.0, 9.0, 11.0, 14.0, 11.0, 16.0, 20.0, 21.0, 29.0, 19.0, 33.0, 36.0, 43.0, 48.0, 51.0, 47.0, 45.0, 61.0, 46.0, 35.0, 39.0, 50.0, 27.0, 37.0, 34.0, 30.0, 28.0, 22.0, 24.0, 12.0, 21.0, 15.0, 17.0, 13.0, 8.0, 8.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.050001621246338, -1.0169678926467896, -0.983934223651886, -0.9509005546569824, -0.9178668260574341, -0.8848330974578857, -0.8517994284629822, -0.8187657594680786, -0.7857320308685303, -0.7526983022689819, -0.7196646332740784, -0.6866309642791748, -0.6535972356796265, -0.6205635070800781, -0.5875298380851746, -0.554496169090271, -0.5214624404907227, -0.4884287416934967, -0.45539504289627075, -0.4223613440990448, -0.38932764530181885, -0.3562939465045929, -0.32326024770736694, -0.290226548910141, -0.25719285011291504, -0.2241591513156891, -0.19112545251846313, -0.15809175372123718, -0.12505805492401123, -0.09202435612678528, -0.058990657329559326, -0.025956958532333374, 0.007076621055603027, 0.04011031985282898, 0.07314401865005493, 0.10617771744728088, 0.13921141624450684, 0.1722451150417328, 0.20527881383895874, 0.2383125126361847, 0.27134621143341064, 0.3043799102306366, 0.33741360902786255, 0.3704473078250885, 0.40348100662231445, 0.4365147054195404, 0.46954840421676636, 0.5025820732116699, 0.5356158018112183, 0.5686495304107666, 0.6016831994056702, 0.6347168684005737, 0.6677505970001221, 0.7007843255996704, 0.733817994594574, 0.7668516635894775, 0.7998853921890259, 0.8329191207885742, 0.8659527897834778, 0.8989864587783813, 0.9320201873779297, 0.965053915977478, 0.9980875849723816, 1.0311212539672852, 1.0641549825668335]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 7.0, 3.0, 4.0, 11.0, 13.0, 11.0, 9.0, 13.0, 25.0, 28.0, 44.0, 64.0, 130.0, 210.0, 322.0, 630.0, 1431.0, 3816.0, 22938.0, 4121273.0, 35220.0, 4771.0, 1679.0, 738.0, 383.0, 193.0, 107.0, 74.0, 37.0, 28.0, 12.0, 9.0, 5.0, 8.0, 8.0, 4.0, 5.0, 4.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.0830078125, -1.0549240112304688, -1.0268402099609375, -0.9987564086914062, -0.970672607421875, -0.9425888061523438, -0.9145050048828125, -0.8864212036132812, -0.85833740234375, -0.8302536010742188, -0.8021697998046875, -0.7740859985351562, -0.746002197265625, -0.7179183959960938, -0.6898345947265625, -0.6617507934570312, -0.6336669921875, -0.6055831909179688, -0.5774993896484375, -0.5494155883789062, -0.521331787109375, -0.49324798583984375, -0.4651641845703125, -0.43708038330078125, -0.40899658203125, -0.38091278076171875, -0.3528289794921875, -0.32474517822265625, -0.296661376953125, -0.26857757568359375, -0.2404937744140625, -0.21240997314453125, -0.184326171875, -0.15624237060546875, -0.1281585693359375, -0.10007476806640625, -0.071990966796875, -0.04390716552734375, -0.0158233642578125, 0.01226043701171875, 0.04034423828125, 0.06842803955078125, 0.0965118408203125, 0.12459564208984375, 0.152679443359375, 0.18076324462890625, 0.2088470458984375, 0.23693084716796875, 0.2650146484375, 0.29309844970703125, 0.3211822509765625, 0.34926605224609375, 0.377349853515625, 0.40543365478515625, 0.4335174560546875, 0.46160125732421875, 0.48968505859375, 0.5177688598632812, 0.5458526611328125, 0.5739364624023438, 0.602020263671875, 0.6301040649414062, 0.6581878662109375, 0.6862716674804688, 0.71435546875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 11.0, 11.0, 17.0, 17.0, 27.0, 23.0, 38.0, 32.0, 44.0, 51.0, 65.0, 66.0, 75.0, 76.0, 83.0, 53.0, 55.0, 61.0, 40.0, 31.0, 33.0, 23.0, 22.0, 14.0, 9.0, 7.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0838623046875, -0.08146286010742188, -0.07906341552734375, -0.07666397094726562, -0.0742645263671875, -0.07186508178710938, -0.06946563720703125, -0.06706619262695312, -0.064666748046875, -0.062267303466796875, -0.05986785888671875, -0.057468414306640625, -0.0550689697265625, -0.052669525146484375, -0.05027008056640625, -0.047870635986328125, -0.04547119140625, -0.043071746826171875, -0.04067230224609375, -0.038272857666015625, -0.0358734130859375, -0.033473968505859375, -0.03107452392578125, -0.028675079345703125, -0.026275634765625, -0.023876190185546875, -0.02147674560546875, -0.019077301025390625, -0.0166778564453125, -0.014278411865234375, -0.01187896728515625, -0.009479522705078125, -0.007080078125, -0.004680633544921875, -0.00228118896484375, 0.000118255615234375, 0.0025177001953125, 0.004917144775390625, 0.00731658935546875, 0.009716033935546875, 0.012115478515625, 0.014514923095703125, 0.01691436767578125, 0.019313812255859375, 0.0217132568359375, 0.024112701416015625, 0.02651214599609375, 0.028911590576171875, 0.03131103515625, 0.033710479736328125, 0.03610992431640625, 0.038509368896484375, 0.0409088134765625, 0.043308258056640625, 0.04570770263671875, 0.048107147216796875, 0.050506591796875, 0.052906036376953125, 0.05530548095703125, 0.057704925537109375, 0.0601043701171875, 0.06250381469726562, 0.06490325927734375, 0.06730270385742188, 0.0697021484375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 7.0, 15.0, 27.0, 44.0, 78.0, 114.0, 230.0, 491.0, 1152.0, 3544.0, 14142.0, 239436.0, 3899295.0, 26987.0, 5696.0, 1697.0, 670.0, 288.0, 158.0, 73.0, 67.0, 25.0, 16.0, 9.0, 7.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67578125, -0.6541061401367188, -0.6324310302734375, -0.6107559204101562, -0.589080810546875, -0.5674057006835938, -0.5457305908203125, -0.5240554809570312, -0.50238037109375, -0.48070526123046875, -0.4590301513671875, -0.43735504150390625, -0.415679931640625, -0.39400482177734375, -0.3723297119140625, -0.35065460205078125, -0.3289794921875, -0.30730438232421875, -0.2856292724609375, -0.26395416259765625, -0.242279052734375, -0.22060394287109375, -0.1989288330078125, -0.17725372314453125, -0.15557861328125, -0.13390350341796875, -0.1122283935546875, -0.09055328369140625, -0.068878173828125, -0.04720306396484375, -0.0255279541015625, -0.00385284423828125, 0.017822265625, 0.03949737548828125, 0.0611724853515625, 0.08284759521484375, 0.104522705078125, 0.12619781494140625, 0.1478729248046875, 0.16954803466796875, 0.19122314453125, 0.21289825439453125, 0.2345733642578125, 0.25624847412109375, 0.277923583984375, 0.29959869384765625, 0.3212738037109375, 0.34294891357421875, 0.3646240234375, 0.38629913330078125, 0.4079742431640625, 0.42964935302734375, 0.451324462890625, 0.47299957275390625, 0.4946746826171875, 0.5163497924804688, 0.53802490234375, 0.5597000122070312, 0.5813751220703125, 0.6030502319335938, 0.624725341796875, 0.6464004516601562, 0.6680755615234375, 0.6897506713867188, 0.71142578125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 4.0, 5.0, 6.0, 5.0, 15.0, 16.0, 26.0, 49.0, 119.0, 489.0, 2308.0, 680.0, 170.0, 64.0, 24.0, 25.0, 15.0, 10.0, 8.0, 7.0, 5.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.152587890625, -0.1476001739501953, -0.14261245727539062, -0.13762474060058594, -0.13263702392578125, -0.12764930725097656, -0.12266159057617188, -0.11767387390136719, -0.1126861572265625, -0.10769844055175781, -0.10271072387695312, -0.09772300720214844, -0.09273529052734375, -0.08774757385253906, -0.08275985717773438, -0.07777214050292969, -0.072784423828125, -0.06779670715332031, -0.06280899047851562, -0.05782127380371094, -0.05283355712890625, -0.04784584045410156, -0.042858123779296875, -0.03787040710449219, -0.0328826904296875, -0.027894973754882812, -0.022907257080078125, -0.017919540405273438, -0.01293182373046875, -0.007944107055664062, -0.002956390380859375, 0.0020313262939453125, 0.00701904296875, 0.012006759643554688, 0.016994476318359375, 0.021982192993164062, 0.02696990966796875, 0.03195762634277344, 0.036945343017578125, 0.04193305969238281, 0.0469207763671875, 0.05190849304199219, 0.056896209716796875, 0.06188392639160156, 0.06687164306640625, 0.07185935974121094, 0.07684707641601562, 0.08183479309082031, 0.086822509765625, 0.09181022644042969, 0.09679794311523438, 0.10178565979003906, 0.10677337646484375, 0.11176109313964844, 0.11674880981445312, 0.12173652648925781, 0.1267242431640625, 0.1317119598388672, 0.13669967651367188, 0.14168739318847656, 0.14667510986328125, 0.15166282653808594, 0.15665054321289062, 0.1616382598876953, 0.1666259765625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 12.0, 26.0, 113.0, 363.0, 359.0, 94.0, 25.0, 10.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1445791721343994, -2.0832011699676514, -2.0218231678009033, -1.9604450464248657, -1.8990669250488281, -1.83768892288208, -1.776310920715332, -1.7149327993392944, -1.6535546779632568, -1.5921766757965088, -1.5307985544204712, -1.4694205522537231, -1.4080424308776855, -1.3466644287109375, -1.2852864265441895, -1.2239083051681519, -1.1625303030014038, -1.1011523008346558, -1.0397741794586182, -0.9783961772918701, -0.9170180559158325, -0.8556400537490845, -0.7942619919776917, -0.7328839302062988, -0.671505868434906, -0.6101278066635132, -0.5487497448921204, -0.4873717129230499, -0.4259936511516571, -0.3646155893802643, -0.30323755741119385, -0.24185949563980103, -0.1804814338684082, -0.11910337954759598, -0.05772532522678375, 0.003652721643447876, 0.0650307834148407, 0.12640884518623352, 0.18778687715530396, 0.24916493892669678, 0.3105430006980896, 0.3719210624694824, 0.43329912424087524, 0.4946771562099457, 0.5560551881790161, 0.6174333095550537, 0.6788113117218018, 0.7401893734931946, 0.8015674352645874, 0.8629454970359802, 0.924323558807373, 0.9857015609741211, 1.0470796823501587, 1.1084576845169067, 1.1698358058929443, 1.2312138080596924, 1.2925918102264404, 1.3539698123931885, 1.415347933769226, 1.4767259359359741, 1.5381040573120117, 1.5994820594787598, 1.6608600616455078, 1.7222381830215454, 1.783616304397583]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 9.0, 7.0, 12.0, 18.0, 26.0, 22.0, 38.0, 51.0, 59.0, 52.0, 64.0, 85.0, 80.0, 68.0, 62.0, 78.0, 63.0, 54.0, 43.0, 32.0, 19.0, 16.0, 15.0, 6.0, 7.0, 3.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.7172259092330933, -0.6996572017669678, -0.6820884943008423, -0.6645197868347168, -0.6469510793685913, -0.6293823719024658, -0.6118136644363403, -0.5942448973655701, -0.5766761898994446, -0.5591074824333191, -0.5415387749671936, -0.5239700675010681, -0.5064013600349426, -0.48883262276649475, -0.47126391530036926, -0.4536952078342438, -0.4361265003681183, -0.4185577929019928, -0.4009890854358673, -0.38342034816741943, -0.36585164070129395, -0.34828293323516846, -0.33071422576904297, -0.3131455183029175, -0.295576810836792, -0.2780081033706665, -0.260439395904541, -0.24287067353725433, -0.22530195116996765, -0.20773324370384216, -0.19016453623771667, -0.1725958287715912, -0.1550270915031433, -0.13745838403701782, -0.11988966166973114, -0.10232095420360565, -0.08475223928689957, -0.06718352437019348, -0.04961481690406799, -0.03204610198736191, -0.014477387070655823, 0.0030913259834051132, 0.02066003903746605, 0.038228750228881836, 0.05579746514558792, 0.073366180062294, 0.0909348875284195, 0.10850360244512558, 0.12607231736183167, 0.14364102482795715, 0.16120974719524384, 0.17877845466136932, 0.196347177028656, 0.2139158844947815, 0.23148459196090698, 0.24905329942703247, 0.26662200689315796, 0.28419071435928345, 0.30175942182540894, 0.3193281292915344, 0.3368968665599823, 0.3544655740261078, 0.3720342814922333, 0.38960298895835876, 0.40717172622680664]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 1.0, 4.0, 7.0, 13.0, 18.0, 27.0, 33.0, 47.0, 51.0, 91.0, 152.0, 252.0, 410.0, 850.0, 1887.0, 4716.0, 15499.0, 72634.0, 413173.0, 435161.0, 78410.0, 16380.0, 4865.0, 1874.0, 856.0, 452.0, 253.0, 142.0, 83.0, 70.0, 39.0, 31.0, 20.0, 16.0, 8.0, 8.0, 8.0, 3.0, 2.0, 3.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.343994140625, -0.3341712951660156, -0.32434844970703125, -0.3145256042480469, -0.3047027587890625, -0.2948799133300781, -0.28505706787109375, -0.2752342224121094, -0.265411376953125, -0.2555885314941406, -0.24576568603515625, -0.23594284057617188, -0.2261199951171875, -0.21629714965820312, -0.20647430419921875, -0.19665145874023438, -0.18682861328125, -0.17700576782226562, -0.16718292236328125, -0.15736007690429688, -0.1475372314453125, -0.13771438598632812, -0.12789154052734375, -0.11806869506835938, -0.108245849609375, -0.09842300415039062, -0.08860015869140625, -0.07877731323242188, -0.0689544677734375, -0.059131622314453125, -0.04930877685546875, -0.039485931396484375, -0.0296630859375, -0.019840240478515625, -0.01001739501953125, -0.000194549560546875, 0.0096282958984375, 0.019451141357421875, 0.02927398681640625, 0.039096832275390625, 0.048919677734375, 0.058742523193359375, 0.06856536865234375, 0.07838821411132812, 0.0882110595703125, 0.09803390502929688, 0.10785675048828125, 0.11767959594726562, 0.12750244140625, 0.13732528686523438, 0.14714813232421875, 0.15697097778320312, 0.1667938232421875, 0.17661666870117188, 0.18643951416015625, 0.19626235961914062, 0.206085205078125, 0.21590805053710938, 0.22573089599609375, 0.23555374145507812, 0.2453765869140625, 0.2551994323730469, 0.26502227783203125, 0.2748451232910156, 0.28466796875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 8.0, 5.0, 8.0, 16.0, 21.0, 16.0, 17.0, 32.0, 36.0, 32.0, 41.0, 48.0, 53.0, 51.0, 65.0, 74.0, 87.0, 62.0, 51.0, 39.0, 52.0, 39.0, 34.0, 27.0, 20.0, 18.0, 18.0, 13.0, 5.0, 7.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07537841796875, -0.07304096221923828, -0.07070350646972656, -0.06836605072021484, -0.06602859497070312, -0.0636911392211914, -0.06135368347167969, -0.05901622772216797, -0.05667877197265625, -0.05434131622314453, -0.05200386047363281, -0.049666404724121094, -0.047328948974609375, -0.044991493225097656, -0.04265403747558594, -0.04031658172607422, -0.0379791259765625, -0.03564167022705078, -0.03330421447753906, -0.030966758728027344, -0.028629302978515625, -0.026291847229003906, -0.023954391479492188, -0.02161693572998047, -0.01927947998046875, -0.01694202423095703, -0.014604568481445312, -0.012267112731933594, -0.009929656982421875, -0.007592201232910156, -0.0052547454833984375, -0.0029172897338867188, -0.000579833984375, 0.0017576217651367188, 0.0040950775146484375, 0.006432533264160156, 0.008769989013671875, 0.011107444763183594, 0.013444900512695312, 0.01578235626220703, 0.01811981201171875, 0.02045726776123047, 0.022794723510742188, 0.025132179260253906, 0.027469635009765625, 0.029807090759277344, 0.03214454650878906, 0.03448200225830078, 0.0368194580078125, 0.03915691375732422, 0.04149436950683594, 0.043831825256347656, 0.046169281005859375, 0.048506736755371094, 0.05084419250488281, 0.05318164825439453, 0.05551910400390625, 0.05785655975341797, 0.06019401550292969, 0.0625314712524414, 0.06486892700195312, 0.06720638275146484, 0.06954383850097656, 0.07188129425048828, 0.07421875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 3.0, 3.0, 7.0, 5.0, 4.0, 5.0, 6.0, 12.0, 13.0, 9.0, 12.0, 36.0, 83.0, 118.0, 292.0, 893.0, 3342.0, 14311.0, 80257.0, 491843.0, 384711.0, 57839.0, 10861.0, 2563.0, 746.0, 264.0, 112.0, 58.0, 41.0, 27.0, 18.0, 21.0, 8.0, 5.0, 6.0, 4.0, 2.0, 5.0, 2.0, 3.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.248046875, -0.23946762084960938, -0.23088836669921875, -0.22230911254882812, -0.2137298583984375, -0.20515060424804688, -0.19657135009765625, -0.18799209594726562, -0.179412841796875, -0.17083358764648438, -0.16225433349609375, -0.15367507934570312, -0.1450958251953125, -0.13651657104492188, -0.12793731689453125, -0.11935806274414062, -0.11077880859375, -0.10219955444335938, -0.09362030029296875, -0.08504104614257812, -0.0764617919921875, -0.06788253784179688, -0.05930328369140625, -0.050724029541015625, -0.042144775390625, -0.033565521240234375, -0.02498626708984375, -0.016407012939453125, -0.0078277587890625, 0.000751495361328125, 0.00933074951171875, 0.017910003662109375, 0.0264892578125, 0.035068511962890625, 0.04364776611328125, 0.052227020263671875, 0.0608062744140625, 0.06938552856445312, 0.07796478271484375, 0.08654403686523438, 0.095123291015625, 0.10370254516601562, 0.11228179931640625, 0.12086105346679688, 0.1294403076171875, 0.13801956176757812, 0.14659881591796875, 0.15517807006835938, 0.16375732421875, 0.17233657836914062, 0.18091583251953125, 0.18949508666992188, 0.1980743408203125, 0.20665359497070312, 0.21523284912109375, 0.22381210327148438, 0.232391357421875, 0.24097061157226562, 0.24954986572265625, 0.2581291198730469, 0.2667083740234375, 0.2752876281738281, 0.28386688232421875, 0.2924461364746094, 0.301025390625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 10.0, 5.0, 9.0, 2.0, 6.0, 13.0, 12.0, 20.0, 30.0, 28.0, 25.0, 31.0, 26.0, 26.0, 38.0, 44.0, 50.0, 37.0, 43.0, 71.0, 42.0, 52.0, 32.0, 44.0, 41.0, 38.0, 31.0, 23.0, 20.0, 21.0, 20.0, 22.0, 20.0, 12.0, 14.0, 11.0, 5.0, 5.0, 3.0, 7.0, 7.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.2205810546875, -0.2137584686279297, -0.20693588256835938, -0.20011329650878906, -0.19329071044921875, -0.18646812438964844, -0.17964553833007812, -0.1728229522705078, -0.1660003662109375, -0.1591777801513672, -0.15235519409179688, -0.14553260803222656, -0.13871002197265625, -0.13188743591308594, -0.12506484985351562, -0.11824226379394531, -0.111419677734375, -0.10459709167480469, -0.09777450561523438, -0.09095191955566406, -0.08412933349609375, -0.07730674743652344, -0.07048416137695312, -0.06366157531738281, -0.0568389892578125, -0.05001640319824219, -0.043193817138671875, -0.03637123107910156, -0.02954864501953125, -0.022726058959960938, -0.015903472900390625, -0.009080886840820312, -0.00225830078125, 0.0045642852783203125, 0.011386871337890625, 0.018209457397460938, 0.02503204345703125, 0.03185462951660156, 0.038677215576171875, 0.04549980163574219, 0.0523223876953125, 0.05914497375488281, 0.06596755981445312, 0.07279014587402344, 0.07961273193359375, 0.08643531799316406, 0.09325790405273438, 0.10008049011230469, 0.106903076171875, 0.11372566223144531, 0.12054824829101562, 0.12737083435058594, 0.13419342041015625, 0.14101600646972656, 0.14783859252929688, 0.1546611785888672, 0.1614837646484375, 0.1683063507080078, 0.17512893676757812, 0.18195152282714844, 0.18877410888671875, 0.19559669494628906, 0.20241928100585938, 0.2092418670654297, 0.216064453125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 6.0, 8.0, 9.0, 17.0, 26.0, 44.0, 79.0, 114.0, 227.0, 463.0, 1190.0, 3934.0, 18226.0, 191787.0, 729000.0, 88047.0, 11041.0, 2632.0, 892.0, 376.0, 186.0, 95.0, 50.0, 31.0, 29.0, 13.0, 11.0, 8.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12890625, -0.12361335754394531, -0.11832046508789062, -0.11302757263183594, -0.10773468017578125, -0.10244178771972656, -0.09714889526367188, -0.09185600280761719, -0.0865631103515625, -0.08127021789550781, -0.07597732543945312, -0.07068443298339844, -0.06539154052734375, -0.06009864807128906, -0.054805755615234375, -0.04951286315917969, -0.044219970703125, -0.03892707824707031, -0.033634185791015625, -0.028341293334960938, -0.02304840087890625, -0.017755508422851562, -0.012462615966796875, -0.0071697235107421875, -0.0018768310546875, 0.0034160614013671875, 0.008708953857421875, 0.014001846313476562, 0.01929473876953125, 0.024587631225585938, 0.029880523681640625, 0.03517341613769531, 0.04046630859375, 0.04575920104980469, 0.051052093505859375, 0.05634498596191406, 0.06163787841796875, 0.06693077087402344, 0.07222366333007812, 0.07751655578613281, 0.0828094482421875, 0.08810234069824219, 0.09339523315429688, 0.09868812561035156, 0.10398101806640625, 0.10927391052246094, 0.11456680297851562, 0.11985969543457031, 0.125152587890625, 0.1304454803466797, 0.13573837280273438, 0.14103126525878906, 0.14632415771484375, 0.15161705017089844, 0.15690994262695312, 0.1622028350830078, 0.1674957275390625, 0.1727886199951172, 0.17808151245117188, 0.18337440490722656, 0.18866729736328125, 0.19396018981933594, 0.19925308227539062, 0.2045459747314453, 0.2098388671875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 4.0, 5.0, 9.0, 7.0, 6.0, 14.0, 25.0, 23.0, 48.0, 46.0, 79.0, 70.0, 91.0, 96.0, 90.0, 88.0, 69.0, 61.0, 45.0, 26.0, 21.0, 10.0, 15.0, 16.0, 9.0, 8.0, 4.0, 4.0, 3.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8358230590820312e-05, -1.7714686691761017e-05, -1.707114279270172e-05, -1.6427598893642426e-05, -1.578405499458313e-05, -1.5140511095523834e-05, -1.4496967196464539e-05, -1.3853423297405243e-05, -1.3209879398345947e-05, -1.2566335499286652e-05, -1.1922791600227356e-05, -1.127924770116806e-05, -1.0635703802108765e-05, -9.992159903049469e-06, -9.348616003990173e-06, -8.705072104930878e-06, -8.061528205871582e-06, -7.417984306812286e-06, -6.774440407752991e-06, -6.130896508693695e-06, -5.487352609634399e-06, -4.843808710575104e-06, -4.200264811515808e-06, -3.5567209124565125e-06, -2.913177013397217e-06, -2.269633114337921e-06, -1.6260892152786255e-06, -9.825453162193298e-07, -3.390014171600342e-07, 3.045424818992615e-07, 9.480863809585571e-07, 1.5916302800178528e-06, 2.2351741790771484e-06, 2.878718078136444e-06, 3.5222619771957397e-06, 4.165805876255035e-06, 4.809349775314331e-06, 5.452893674373627e-06, 6.096437573432922e-06, 6.739981472492218e-06, 7.383525371551514e-06, 8.02706927061081e-06, 8.670613169670105e-06, 9.3141570687294e-06, 9.957700967788696e-06, 1.0601244866847992e-05, 1.1244788765907288e-05, 1.1888332664966583e-05, 1.2531876564025879e-05, 1.3175420463085175e-05, 1.381896436214447e-05, 1.4462508261203766e-05, 1.5106052160263062e-05, 1.5749596059322357e-05, 1.6393139958381653e-05, 1.703668385744095e-05, 1.7680227756500244e-05, 1.832377165555954e-05, 1.8967315554618835e-05, 1.961085945367813e-05, 2.0254403352737427e-05, 2.0897947251796722e-05, 2.1541491150856018e-05, 2.2185035049915314e-05, 2.282857894897461e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 17.0, 18.0, 32.0, 75.0, 98.0, 286.0, 2041.0, 30286.0, 896525.0, 113962.0, 4352.0, 537.0, 152.0, 80.0, 40.0, 31.0, 13.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18115234375, -0.17144775390625, -0.1617431640625, -0.15203857421875, -0.142333984375, -0.13262939453125, -0.1229248046875, -0.11322021484375, -0.103515625, -0.09381103515625, -0.0841064453125, -0.07440185546875, -0.064697265625, -0.05499267578125, -0.0452880859375, -0.03558349609375, -0.02587890625, -0.01617431640625, -0.0064697265625, 0.00323486328125, 0.012939453125, 0.02264404296875, 0.0323486328125, 0.04205322265625, 0.0517578125, 0.06146240234375, 0.0711669921875, 0.08087158203125, 0.090576171875, 0.10028076171875, 0.1099853515625, 0.11968994140625, 0.12939453125, 0.13909912109375, 0.1488037109375, 0.15850830078125, 0.168212890625, 0.17791748046875, 0.1876220703125, 0.19732666015625, 0.20703125, 0.21673583984375, 0.2264404296875, 0.23614501953125, 0.245849609375, 0.25555419921875, 0.2652587890625, 0.27496337890625, 0.28466796875, 0.29437255859375, 0.3040771484375, 0.31378173828125, 0.323486328125, 0.33319091796875, 0.3428955078125, 0.35260009765625, 0.3623046875, 0.37200927734375, 0.3817138671875, 0.39141845703125, 0.401123046875, 0.41082763671875, 0.4205322265625, 0.43023681640625, 0.43994140625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 4.0, 1.0, 4.0, 8.0, 8.0, 17.0, 30.0, 38.0, 74.0, 91.0, 150.0, 132.0, 143.0, 100.0, 68.0, 55.0, 27.0, 25.0, 17.0, 9.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0831298828125, -0.07776832580566406, -0.07240676879882812, -0.06704521179199219, -0.06168365478515625, -0.05632209777832031, -0.050960540771484375, -0.04559898376464844, -0.0402374267578125, -0.03487586975097656, -0.029514312744140625, -0.024152755737304688, -0.01879119873046875, -0.013429641723632812, -0.008068084716796875, -0.0027065277099609375, 0.002655029296875, 0.008016586303710938, 0.013378143310546875, 0.018739700317382812, 0.02410125732421875, 0.029462814331054688, 0.034824371337890625, 0.04018592834472656, 0.0455474853515625, 0.05090904235839844, 0.056270599365234375, 0.06163215637207031, 0.06699371337890625, 0.07235527038574219, 0.07771682739257812, 0.08307838439941406, 0.08843994140625, 0.09380149841308594, 0.09916305541992188, 0.10452461242675781, 0.10988616943359375, 0.11524772644042969, 0.12060928344726562, 0.12597084045410156, 0.1313323974609375, 0.13669395446777344, 0.14205551147460938, 0.1474170684814453, 0.15277862548828125, 0.1581401824951172, 0.16350173950195312, 0.16886329650878906, 0.174224853515625, 0.17958641052246094, 0.18494796752929688, 0.1903095245361328, 0.19567108154296875, 0.2010326385498047, 0.20639419555664062, 0.21175575256347656, 0.2171173095703125, 0.22247886657714844, 0.22784042358398438, 0.2332019805908203, 0.23856353759765625, 0.2439250946044922, 0.24928665161132812, 0.25464820861816406, 0.260009765625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [2.0, 18.0, 56.0, 160.0, 372.0, 269.0, 92.0, 36.0, 9.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6088330745697021, -0.479824036359787, -0.3508149981498718, -0.22180595993995667, -0.0927969217300415, 0.03621208667755127, 0.16522115468978882, 0.29423022270202637, 0.42323923110961914, 0.5522482395172119, 0.6812573075294495, 0.810266375541687, 0.9392753839492798, 1.0682843923568726, 1.1972935199737549, 1.3263025283813477, 1.4553115367889404, 1.5843205451965332, 1.713329553604126, 1.8423386812210083, 1.971347689628601, 2.1003565788269043, 2.229365825653076, 2.358374834060669, 2.4873838424682617, 2.6163928508758545, 2.7454018592834473, 2.87441086769104, 3.003419876098633, 3.1324291229248047, 3.2614381313323975, 3.3904471397399902, 3.519455909729004, 3.6484649181365967, 3.7774739265441895, 3.9064829349517822, 4.035491943359375, 4.164501190185547, 4.2935099601745605, 4.422519207000732, 4.551527976989746, 4.680537223815918, 4.809545993804932, 4.9385552406311035, 5.067564010620117, 5.196573257446289, 5.325582027435303, 5.454591274261475, 5.5836005210876465, 5.712609767913818, 5.841618537902832, 5.970627784729004, 6.099636554718018, 6.2286458015441895, 6.357654571533203, 6.486663818359375, 6.615673065185547, 6.744682312011719, 6.873691082000732, 7.002700328826904, 7.131709098815918, 7.26071834564209, 7.3897271156311035, 7.518736362457275, 7.647745132446289]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 4.0, 5.0, 11.0, 8.0, 16.0, 13.0, 14.0, 24.0, 19.0, 24.0, 19.0, 24.0, 37.0, 37.0, 40.0, 50.0, 38.0, 40.0, 46.0, 53.0, 40.0, 39.0, 48.0, 38.0, 39.0, 33.0, 30.0, 27.0, 26.0, 23.0, 27.0, 17.0, 23.0, 11.0, 13.0, 12.0, 6.0, 7.0, 7.0, 3.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.2381360530853271, -1.2033342123031616, -1.168532371520996, -1.1337305307388306, -1.098928689956665, -1.0641268491744995, -1.029325008392334, -0.9945231080055237, -0.9597212672233582, -0.9249194264411926, -0.8901175856590271, -0.8553157448768616, -0.8205138444900513, -0.7857120037078857, -0.7509101629257202, -0.7161083221435547, -0.6813064813613892, -0.6465046405792236, -0.6117027997970581, -0.5769009590148926, -0.542099118232727, -0.5072972774505615, -0.4724953770637512, -0.4376935362815857, -0.40289169549942017, -0.36808985471725464, -0.3332880139350891, -0.2984861433506012, -0.26368430256843567, -0.22888246178627014, -0.19408060610294342, -0.1592787504196167, -0.12447690963745117, -0.08967506140470505, -0.05487321317195892, -0.0200713649392128, 0.014730483293533325, 0.04953232407569885, 0.08433417975902557, 0.1191360354423523, 0.15393787622451782, 0.18873971700668335, 0.22354157269001007, 0.2583434283733368, 0.2931452691555023, 0.32794710993766785, 0.36274898052215576, 0.3975508213043213, 0.4323526620864868, 0.46715450286865234, 0.5019563436508179, 0.5367581844329834, 0.5715600252151489, 0.6063618659973145, 0.6411637663841248, 0.6759656071662903, 0.7107674479484558, 0.7455692887306213, 0.7803711295127869, 0.8151729702949524, 0.8499748706817627, 0.8847767114639282, 0.9195785522460938, 0.9543803930282593, 0.9891822338104248]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 6.0, 6.0, 4.0, 3.0, 8.0, 8.0, 6.0, 14.0, 10.0, 25.0, 16.0, 31.0, 41.0, 55.0, 99.0, 179.0, 319.0, 663.0, 1795.0, 5650.0, 34136.0, 4047056.0, 90385.0, 9372.0, 2510.0, 944.0, 445.0, 191.0, 97.0, 69.0, 40.0, 27.0, 19.0, 18.0, 11.0, 15.0, 5.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.77001953125, -0.7500991821289062, -0.7301788330078125, -0.7102584838867188, -0.690338134765625, -0.6704177856445312, -0.6504974365234375, -0.6305770874023438, -0.61065673828125, -0.5907363891601562, -0.5708160400390625, -0.5508956909179688, -0.530975341796875, -0.5110549926757812, -0.4911346435546875, -0.47121429443359375, -0.4512939453125, -0.43137359619140625, -0.4114532470703125, -0.39153289794921875, -0.371612548828125, -0.35169219970703125, -0.3317718505859375, -0.31185150146484375, -0.29193115234375, -0.27201080322265625, -0.2520904541015625, -0.23217010498046875, -0.212249755859375, -0.19232940673828125, -0.1724090576171875, -0.15248870849609375, -0.132568359375, -0.11264801025390625, -0.0927276611328125, -0.07280731201171875, -0.052886962890625, -0.03296661376953125, -0.0130462646484375, 0.00687408447265625, 0.02679443359375, 0.04671478271484375, 0.0666351318359375, 0.08655548095703125, 0.106475830078125, 0.12639617919921875, 0.1463165283203125, 0.16623687744140625, 0.1861572265625, 0.20607757568359375, 0.2259979248046875, 0.24591827392578125, 0.265838623046875, 0.28575897216796875, 0.3056793212890625, 0.32559967041015625, 0.34552001953125, 0.36544036865234375, 0.3853607177734375, 0.40528106689453125, 0.425201416015625, 0.44512176513671875, 0.4650421142578125, 0.48496246337890625, 0.5048828125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 7.0, 6.0, 12.0, 19.0, 19.0, 28.0, 25.0, 37.0, 55.0, 34.0, 59.0, 61.0, 60.0, 72.0, 61.0, 61.0, 62.0, 62.0, 58.0, 46.0, 33.0, 29.0, 28.0, 23.0, 15.0, 8.0, 10.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.084228515625, -0.08167362213134766, -0.07911872863769531, -0.07656383514404297, -0.07400894165039062, -0.07145404815673828, -0.06889915466308594, -0.0663442611694336, -0.06378936767578125, -0.061234474182128906, -0.05867958068847656, -0.05612468719482422, -0.053569793701171875, -0.05101490020751953, -0.04846000671386719, -0.045905113220214844, -0.0433502197265625, -0.040795326232910156, -0.03824043273925781, -0.03568553924560547, -0.033130645751953125, -0.03057575225830078, -0.028020858764648438, -0.025465965270996094, -0.02291107177734375, -0.020356178283691406, -0.017801284790039062, -0.015246391296386719, -0.012691497802734375, -0.010136604309082031, -0.0075817108154296875, -0.005026817321777344, -0.002471923828125, 8.296966552734375e-05, 0.0026378631591796875, 0.005192756652832031, 0.007747650146484375, 0.010302543640136719, 0.012857437133789062, 0.015412330627441406, 0.01796722412109375, 0.020522117614746094, 0.023077011108398438, 0.02563190460205078, 0.028186798095703125, 0.03074169158935547, 0.03329658508300781, 0.035851478576660156, 0.0384063720703125, 0.040961265563964844, 0.04351615905761719, 0.04607105255126953, 0.048625946044921875, 0.05118083953857422, 0.05373573303222656, 0.056290626525878906, 0.05884552001953125, 0.061400413513183594, 0.06395530700683594, 0.06651020050048828, 0.06906509399414062, 0.07161998748779297, 0.07417488098144531, 0.07672977447509766, 0.07928466796875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 6.0, 8.0, 9.0, 14.0, 12.0, 22.0, 40.0, 69.0, 117.0, 196.0, 429.0, 1185.0, 3903.0, 29586.0, 4108129.0, 43470.0, 4793.0, 1286.0, 465.0, 209.0, 122.0, 73.0, 38.0, 29.0, 31.0, 7.0, 13.0, 9.0, 4.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.716796875, -0.6835479736328125, -0.650299072265625, -0.6170501708984375, -0.58380126953125, -0.5505523681640625, -0.517303466796875, -0.4840545654296875, -0.4508056640625, -0.4175567626953125, -0.384307861328125, -0.3510589599609375, -0.31781005859375, -0.2845611572265625, -0.251312255859375, -0.2180633544921875, -0.184814453125, -0.1515655517578125, -0.118316650390625, -0.0850677490234375, -0.05181884765625, -0.0185699462890625, 0.014678955078125, 0.0479278564453125, 0.0811767578125, 0.1144256591796875, 0.147674560546875, 0.1809234619140625, 0.21417236328125, 0.2474212646484375, 0.280670166015625, 0.3139190673828125, 0.34716796875, 0.3804168701171875, 0.413665771484375, 0.4469146728515625, 0.48016357421875, 0.5134124755859375, 0.546661376953125, 0.5799102783203125, 0.6131591796875, 0.6464080810546875, 0.679656982421875, 0.7129058837890625, 0.74615478515625, 0.7794036865234375, 0.812652587890625, 0.8459014892578125, 0.879150390625, 0.9123992919921875, 0.945648193359375, 0.9788970947265625, 1.01214599609375, 1.0453948974609375, 1.078643798828125, 1.1118927001953125, 1.1451416015625, 1.1783905029296875, 1.211639404296875, 1.2448883056640625, 1.27813720703125, 1.3113861083984375, 1.344635009765625, 1.3778839111328125, 1.4111328125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 8.0, 11.0, 8.0, 22.0, 36.0, 93.0, 620.0, 2961.0, 176.0, 73.0, 25.0, 17.0, 4.0, 7.0, 7.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1497802734375, -0.14108848571777344, -0.13239669799804688, -0.12370491027832031, -0.11501312255859375, -0.10632133483886719, -0.09762954711914062, -0.08893775939941406, -0.0802459716796875, -0.07155418395996094, -0.06286239624023438, -0.05417060852050781, -0.04547882080078125, -0.03678703308105469, -0.028095245361328125, -0.019403457641601562, -0.010711669921875, -0.0020198822021484375, 0.006671905517578125, 0.015363693237304688, 0.02405548095703125, 0.03274726867675781, 0.041439056396484375, 0.05013084411621094, 0.0588226318359375, 0.06751441955566406, 0.07620620727539062, 0.08489799499511719, 0.09358978271484375, 0.10228157043457031, 0.11097335815429688, 0.11966514587402344, 0.12835693359375, 0.13704872131347656, 0.14574050903320312, 0.1544322967529297, 0.16312408447265625, 0.1718158721923828, 0.18050765991210938, 0.18919944763183594, 0.1978912353515625, 0.20658302307128906, 0.21527481079101562, 0.2239665985107422, 0.23265838623046875, 0.2413501739501953, 0.2500419616699219, 0.25873374938964844, 0.267425537109375, 0.27611732482910156, 0.2848091125488281, 0.2935009002685547, 0.30219268798828125, 0.3108844757080078, 0.3195762634277344, 0.32826805114746094, 0.3369598388671875, 0.34565162658691406, 0.3543434143066406, 0.3630352020263672, 0.37172698974609375, 0.3804187774658203, 0.3891105651855469, 0.39780235290527344, 0.406494140625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 9.0, 7.0, 23.0, 35.0, 101.0, 168.0, 238.0, 198.0, 114.0, 46.0, 32.0, 12.0, 4.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8871736526489258, -0.8499359488487244, -0.8126981854438782, -0.7754604816436768, -0.7382227182388306, -0.7009850144386292, -0.6637473106384277, -0.6265095472335815, -0.5892717838287354, -0.5520340800285339, -0.5147963166236877, -0.47755861282348633, -0.44032084941864014, -0.4030831456184387, -0.3658454120159149, -0.3286076784133911, -0.2913699746131897, -0.2541322410106659, -0.2168945074081421, -0.17965678870677948, -0.14241905510425568, -0.10518132150173187, -0.06794360280036926, -0.03070586919784546, 0.006531864404678345, 0.04376959428191185, 0.08100732415914536, 0.11824505031108856, 0.15548278391361237, 0.19272051751613617, 0.22995823621749878, 0.2671959698200226, 0.3044337034225464, 0.3416714370250702, 0.378909170627594, 0.4161468744277954, 0.4533846378326416, 0.490622341632843, 0.5278600454330444, 0.5650978088378906, 0.6023355722427368, 0.6395732760429382, 0.6768110394477844, 0.7140487432479858, 0.751286506652832, 0.7885242104530334, 0.8257619142532349, 0.862999677658081, 0.9002373814582825, 0.9374750852584839, 0.9747128486633301, 1.0119506120681763, 1.049188256263733, 1.086426019668579, 1.1236637830734253, 1.1609015464782715, 1.1981391906738281, 1.2353769540786743, 1.272614598274231, 1.3098523616790771, 1.3470901250839233, 1.3843278884887695, 1.4215655326843262, 1.4588032960891724, 1.4960410594940186]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 13.0, 18.0, 28.0, 37.0, 67.0, 100.0, 97.0, 118.0, 122.0, 122.0, 86.0, 83.0, 53.0, 14.0, 22.0, 9.0, 9.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8376607894897461, -0.8067715764045715, -0.775882363319397, -0.7449931502342224, -0.7141039371490479, -0.6832147240638733, -0.6523255109786987, -0.621436357498169, -0.5905470848083496, -0.559657871723175, -0.5287686586380005, -0.4978794455528259, -0.46699023246765137, -0.4361010193824768, -0.40521183609962463, -0.3743226230144501, -0.3434334397315979, -0.31254422664642334, -0.2816550135612488, -0.2507658004760742, -0.21987660229206085, -0.1889873892068863, -0.15809819102287292, -0.12720897793769836, -0.0963197648525238, -0.06543055176734924, -0.03454134613275528, -0.003652140498161316, 0.027237072587013245, 0.058126285672187805, 0.08901548385620117, 0.11990469694137573, 0.1507939100265503, 0.18168312311172485, 0.21257233619689941, 0.24346153438091278, 0.27435076236724854, 0.3052399754524231, 0.33612915873527527, 0.36701837182044983, 0.3979075849056244, 0.42879679799079895, 0.4596860110759735, 0.4905751943588257, 0.5214644074440002, 0.5523536205291748, 0.5832428336143494, 0.6141320466995239, 0.6450212597846985, 0.675910472869873, 0.7067996859550476, 0.7376888990402222, 0.7685781121253967, 0.7994673252105713, 0.8303564786911011, 0.8612457513809204, 0.8921349048614502, 0.9230241179466248, 0.9539133310317993, 0.9848025441169739, 1.0156917572021484, 1.0465809106826782, 1.0774701833724976, 1.1083593368530273, 1.1392486095428467]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 5.0, 6.0, 10.0, 11.0, 17.0, 15.0, 25.0, 30.0, 67.0, 85.0, 132.0, 207.0, 366.0, 823.0, 1699.0, 4920.0, 17583.0, 81896.0, 395745.0, 425146.0, 91235.0, 19479.0, 5250.0, 1937.0, 790.0, 413.0, 227.0, 139.0, 86.0, 59.0, 39.0, 41.0, 15.0, 14.0, 11.0, 7.0, 4.0, 4.0, 8.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.301513671875, -0.2917976379394531, -0.28208160400390625, -0.2723655700683594, -0.2626495361328125, -0.2529335021972656, -0.24321746826171875, -0.23350143432617188, -0.223785400390625, -0.21406936645507812, -0.20435333251953125, -0.19463729858398438, -0.1849212646484375, -0.17520523071289062, -0.16548919677734375, -0.15577316284179688, -0.14605712890625, -0.13634109497070312, -0.12662506103515625, -0.11690902709960938, -0.1071929931640625, -0.09747695922851562, -0.08776092529296875, -0.07804489135742188, -0.068328857421875, -0.058612823486328125, -0.04889678955078125, -0.039180755615234375, -0.0294647216796875, -0.019748687744140625, -0.01003265380859375, -0.000316619873046875, 0.0093994140625, 0.019115447998046875, 0.02883148193359375, 0.038547515869140625, 0.0482635498046875, 0.057979583740234375, 0.06769561767578125, 0.07741165161132812, 0.087127685546875, 0.09684371948242188, 0.10655975341796875, 0.11627578735351562, 0.1259918212890625, 0.13570785522460938, 0.14542388916015625, 0.15513992309570312, 0.16485595703125, 0.17457199096679688, 0.18428802490234375, 0.19400405883789062, 0.2037200927734375, 0.21343612670898438, 0.22315216064453125, 0.23286819458007812, 0.242584228515625, 0.2523002624511719, 0.26201629638671875, 0.2717323303222656, 0.2814483642578125, 0.2911643981933594, 0.30088043212890625, 0.3105964660644531, 0.3203125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 5.0, 14.0, 7.0, 20.0, 21.0, 27.0, 26.0, 41.0, 34.0, 52.0, 48.0, 46.0, 69.0, 60.0, 63.0, 70.0, 57.0, 49.0, 48.0, 58.0, 42.0, 28.0, 34.0, 22.0, 17.0, 9.0, 13.0, 6.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0859375, -0.08335208892822266, -0.08076667785644531, -0.07818126678466797, -0.07559585571289062, -0.07301044464111328, -0.07042503356933594, -0.0678396224975586, -0.06525421142578125, -0.0626688003540039, -0.06008338928222656, -0.05749797821044922, -0.054912567138671875, -0.05232715606689453, -0.04974174499511719, -0.047156333923339844, -0.0445709228515625, -0.041985511779785156, -0.03940010070800781, -0.03681468963623047, -0.034229278564453125, -0.03164386749267578, -0.029058456420898438, -0.026473045349121094, -0.02388763427734375, -0.021302223205566406, -0.018716812133789062, -0.01613140106201172, -0.013545989990234375, -0.010960578918457031, -0.008375167846679688, -0.005789756774902344, -0.003204345703125, -0.0006189346313476562, 0.0019664764404296875, 0.004551887512207031, 0.007137298583984375, 0.009722709655761719, 0.012308120727539062, 0.014893531799316406, 0.01747894287109375, 0.020064353942871094, 0.022649765014648438, 0.02523517608642578, 0.027820587158203125, 0.03040599822998047, 0.03299140930175781, 0.035576820373535156, 0.0381622314453125, 0.040747642517089844, 0.04333305358886719, 0.04591846466064453, 0.048503875732421875, 0.05108928680419922, 0.05367469787597656, 0.056260108947753906, 0.05884552001953125, 0.061430931091308594, 0.06401634216308594, 0.06660175323486328, 0.06918716430664062, 0.07177257537841797, 0.07435798645019531, 0.07694339752197266, 0.07952880859375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 3.0, 15.0, 11.0, 19.0, 25.0, 43.0, 65.0, 111.0, 164.0, 357.0, 796.0, 2699.0, 12765.0, 85982.0, 533400.0, 353637.0, 47423.0, 7948.0, 1813.0, 618.0, 266.0, 153.0, 67.0, 56.0, 33.0, 24.0, 12.0, 13.0, 12.0, 9.0, 6.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2298583984375, -0.2206096649169922, -0.21136093139648438, -0.20211219787597656, -0.19286346435546875, -0.18361473083496094, -0.17436599731445312, -0.1651172637939453, -0.1558685302734375, -0.1466197967529297, -0.13737106323242188, -0.12812232971191406, -0.11887359619140625, -0.10962486267089844, -0.10037612915039062, -0.09112739562988281, -0.081878662109375, -0.07262992858886719, -0.06338119506835938, -0.05413246154785156, -0.04488372802734375, -0.03563499450683594, -0.026386260986328125, -0.017137527465820312, -0.0078887939453125, 0.0013599395751953125, 0.010608673095703125, 0.019857406616210938, 0.02910614013671875, 0.03835487365722656, 0.047603607177734375, 0.05685234069824219, 0.06610107421875, 0.07534980773925781, 0.08459854125976562, 0.09384727478027344, 0.10309600830078125, 0.11234474182128906, 0.12159347534179688, 0.1308422088623047, 0.1400909423828125, 0.1493396759033203, 0.15858840942382812, 0.16783714294433594, 0.17708587646484375, 0.18633460998535156, 0.19558334350585938, 0.2048320770263672, 0.214080810546875, 0.2233295440673828, 0.23257827758789062, 0.24182701110839844, 0.25107574462890625, 0.26032447814941406, 0.2695732116699219, 0.2788219451904297, 0.2880706787109375, 0.2973194122314453, 0.3065681457519531, 0.31581687927246094, 0.32506561279296875, 0.33431434631347656, 0.3435630798339844, 0.3528118133544922, 0.362060546875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 10.0, 1.0, 3.0, 5.0, 10.0, 5.0, 11.0, 16.0, 20.0, 16.0, 25.0, 20.0, 25.0, 26.0, 27.0, 31.0, 33.0, 38.0, 25.0, 30.0, 44.0, 41.0, 34.0, 42.0, 49.0, 41.0, 35.0, 31.0, 37.0, 40.0, 40.0, 22.0, 26.0, 31.0, 18.0, 17.0, 14.0, 11.0, 11.0, 9.0, 5.0, 8.0, 7.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2371826171875, -0.23010635375976562, -0.22303009033203125, -0.21595382690429688, -0.2088775634765625, -0.20180130004882812, -0.19472503662109375, -0.18764877319335938, -0.180572509765625, -0.17349624633789062, -0.16641998291015625, -0.15934371948242188, -0.1522674560546875, -0.14519119262695312, -0.13811492919921875, -0.13103866577148438, -0.12396240234375, -0.11688613891601562, -0.10980987548828125, -0.10273361206054688, -0.0956573486328125, -0.08858108520507812, -0.08150482177734375, -0.07442855834960938, -0.067352294921875, -0.060276031494140625, -0.05319976806640625, -0.046123504638671875, -0.0390472412109375, -0.031970977783203125, -0.02489471435546875, -0.017818450927734375, -0.0107421875, -0.003665924072265625, 0.00341033935546875, 0.010486602783203125, 0.0175628662109375, 0.024639129638671875, 0.03171539306640625, 0.038791656494140625, 0.045867919921875, 0.052944183349609375, 0.06002044677734375, 0.06709671020507812, 0.0741729736328125, 0.08124923706054688, 0.08832550048828125, 0.09540176391601562, 0.10247802734375, 0.10955429077148438, 0.11663055419921875, 0.12370681762695312, 0.1307830810546875, 0.13785934448242188, 0.14493560791015625, 0.15201187133789062, 0.159088134765625, 0.16616439819335938, 0.17324066162109375, 0.18031692504882812, 0.1873931884765625, 0.19446945190429688, 0.20154571533203125, 0.20862197875976562, 0.2156982421875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 5.0, 9.0, 9.0, 6.0, 20.0, 25.0, 32.0, 55.0, 76.0, 116.0, 206.0, 369.0, 578.0, 1290.0, 2899.0, 7551.0, 24585.0, 111474.0, 520043.0, 301048.0, 54813.0, 14152.0, 5018.0, 2040.0, 892.0, 473.0, 285.0, 175.0, 104.0, 57.0, 40.0, 31.0, 29.0, 13.0, 7.0, 5.0, 4.0, 7.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09991455078125, -0.09644317626953125, -0.0929718017578125, -0.08950042724609375, -0.086029052734375, -0.08255767822265625, -0.0790863037109375, -0.07561492919921875, -0.0721435546875, -0.06867218017578125, -0.0652008056640625, -0.06172943115234375, -0.058258056640625, -0.05478668212890625, -0.0513153076171875, -0.04784393310546875, -0.04437255859375, -0.04090118408203125, -0.0374298095703125, -0.03395843505859375, -0.030487060546875, -0.02701568603515625, -0.0235443115234375, -0.02007293701171875, -0.0166015625, -0.01313018798828125, -0.0096588134765625, -0.00618743896484375, -0.002716064453125, 0.00075531005859375, 0.0042266845703125, 0.00769805908203125, 0.01116943359375, 0.01464080810546875, 0.0181121826171875, 0.02158355712890625, 0.025054931640625, 0.02852630615234375, 0.0319976806640625, 0.03546905517578125, 0.0389404296875, 0.04241180419921875, 0.0458831787109375, 0.04935455322265625, 0.052825927734375, 0.05629730224609375, 0.0597686767578125, 0.06324005126953125, 0.06671142578125, 0.07018280029296875, 0.0736541748046875, 0.07712554931640625, 0.080596923828125, 0.08406829833984375, 0.0875396728515625, 0.09101104736328125, 0.094482421875, 0.09795379638671875, 0.1014251708984375, 0.10489654541015625, 0.108367919921875, 0.11183929443359375, 0.1153106689453125, 0.11878204345703125, 0.12225341796875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 5.0, 8.0, 5.0, 12.0, 11.0, 26.0, 22.0, 31.0, 44.0, 52.0, 71.0, 78.0, 71.0, 76.0, 120.0, 61.0, 70.0, 34.0, 43.0, 36.0, 22.0, 22.0, 10.0, 12.0, 13.0, 9.0, 5.0, 4.0, 4.0, 1.0, 6.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.913309097290039e-05, -1.8524006009101868e-05, -1.7914921045303345e-05, -1.7305836081504822e-05, -1.66967511177063e-05, -1.6087666153907776e-05, -1.5478581190109253e-05, -1.486949622631073e-05, -1.4260411262512207e-05, -1.3651326298713684e-05, -1.3042241334915161e-05, -1.2433156371116638e-05, -1.1824071407318115e-05, -1.1214986443519592e-05, -1.060590147972107e-05, -9.996816515922546e-06, -9.387731552124023e-06, -8.7786465883255e-06, -8.169561624526978e-06, -7.560476660728455e-06, -6.951391696929932e-06, -6.342306733131409e-06, -5.733221769332886e-06, -5.124136805534363e-06, -4.51505184173584e-06, -3.905966877937317e-06, -3.296881914138794e-06, -2.687796950340271e-06, -2.078711986541748e-06, -1.469627022743225e-06, -8.605420589447021e-07, -2.514570951461792e-07, 3.5762786865234375e-07, 9.667128324508667e-07, 1.5757977962493896e-06, 2.1848827600479126e-06, 2.7939677238464355e-06, 3.4030526876449585e-06, 4.0121376514434814e-06, 4.621222615242004e-06, 5.230307579040527e-06, 5.83939254283905e-06, 6.448477506637573e-06, 7.057562470436096e-06, 7.666647434234619e-06, 8.275732398033142e-06, 8.884817361831665e-06, 9.493902325630188e-06, 1.0102987289428711e-05, 1.0712072253227234e-05, 1.1321157217025757e-05, 1.193024218082428e-05, 1.2539327144622803e-05, 1.3148412108421326e-05, 1.3757497072219849e-05, 1.4366582036018372e-05, 1.4975666999816895e-05, 1.5584751963615417e-05, 1.619383692741394e-05, 1.6802921891212463e-05, 1.7412006855010986e-05, 1.802109181880951e-05, 1.8630176782608032e-05, 1.9239261746406555e-05, 1.9848346710205078e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 5.0, 15.0, 25.0, 40.0, 70.0, 146.0, 333.0, 1167.0, 5350.0, 46960.0, 723340.0, 251736.0, 15699.0, 2536.0, 673.0, 237.0, 94.0, 62.0, 22.0, 18.0, 7.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1968994140625, -0.18926048278808594, -0.18162155151367188, -0.1739826202392578, -0.16634368896484375, -0.1587047576904297, -0.15106582641601562, -0.14342689514160156, -0.1357879638671875, -0.12814903259277344, -0.12051010131835938, -0.11287117004394531, -0.10523223876953125, -0.09759330749511719, -0.08995437622070312, -0.08231544494628906, -0.074676513671875, -0.06703758239746094, -0.059398651123046875, -0.05175971984863281, -0.04412078857421875, -0.03648185729980469, -0.028842926025390625, -0.021203994750976562, -0.0135650634765625, -0.0059261322021484375, 0.001712799072265625, 0.009351730346679688, 0.01699066162109375, 0.024629592895507812, 0.032268524169921875, 0.03990745544433594, 0.04754638671875, 0.05518531799316406, 0.06282424926757812, 0.07046318054199219, 0.07810211181640625, 0.08574104309082031, 0.09337997436523438, 0.10101890563964844, 0.1086578369140625, 0.11629676818847656, 0.12393569946289062, 0.1315746307373047, 0.13921356201171875, 0.1468524932861328, 0.15449142456054688, 0.16213035583496094, 0.169769287109375, 0.17740821838378906, 0.18504714965820312, 0.1926860809326172, 0.20032501220703125, 0.2079639434814453, 0.21560287475585938, 0.22324180603027344, 0.2308807373046875, 0.23851966857910156, 0.24615859985351562, 0.2537975311279297, 0.26143646240234375, 0.2690753936767578, 0.2767143249511719, 0.28435325622558594, 0.2919921875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 6.0, 7.0, 17.0, 14.0, 24.0, 43.0, 53.0, 67.0, 83.0, 102.0, 127.0, 101.0, 103.0, 74.0, 61.0, 38.0, 19.0, 15.0, 25.0, 10.0, 7.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10638427734375, -0.10167789459228516, -0.09697151184082031, -0.09226512908935547, -0.08755874633789062, -0.08285236358642578, -0.07814598083496094, -0.0734395980834961, -0.06873321533203125, -0.0640268325805664, -0.05932044982910156, -0.05461406707763672, -0.049907684326171875, -0.04520130157470703, -0.04049491882324219, -0.035788536071777344, -0.0310821533203125, -0.026375770568847656, -0.021669387817382812, -0.01696300506591797, -0.012256622314453125, -0.007550239562988281, -0.0028438568115234375, 0.0018625259399414062, 0.00656890869140625, 0.011275291442871094, 0.015981674194335938, 0.02068805694580078, 0.025394439697265625, 0.03010082244873047, 0.03480720520019531, 0.039513587951660156, 0.044219970703125, 0.048926353454589844, 0.05363273620605469, 0.05833911895751953, 0.06304550170898438, 0.06775188446044922, 0.07245826721191406, 0.0771646499633789, 0.08187103271484375, 0.0865774154663086, 0.09128379821777344, 0.09599018096923828, 0.10069656372070312, 0.10540294647216797, 0.11010932922363281, 0.11481571197509766, 0.1195220947265625, 0.12422847747802734, 0.1289348602294922, 0.13364124298095703, 0.13834762573242188, 0.14305400848388672, 0.14776039123535156, 0.1524667739868164, 0.15717315673828125, 0.1618795394897461, 0.16658592224121094, 0.17129230499267578, 0.17599868774414062, 0.18070507049560547, 0.1854114532470703, 0.19011783599853516, 0.19482421875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 10.0, 13.0, 44.0, 91.0, 162.0, 246.0, 240.0, 123.0, 53.0, 22.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1745418310165405, -1.0743021965026855, -0.9740626215934753, -0.8738230466842651, -0.7735834121704102, -0.6733437776565552, -0.573104202747345, -0.47286462783813477, -0.3726249933242798, -0.2723853886127472, -0.1721457839012146, -0.071906179189682, 0.028333425521850586, 0.12857306003570557, 0.22881263494491577, 0.329052209854126, 0.42929184436798096, 0.5295314788818359, 0.6297710537910461, 0.7300106287002563, 0.8302502632141113, 0.9304898977279663, 1.0307295322418213, 1.1309690475463867, 1.2312086820602417, 1.3314483165740967, 1.431687831878662, 1.531927466392517, 1.632167100906372, 1.732406735420227, 1.832646369934082, 1.9328858852386475, 2.033125400543213, 2.1333649158477783, 2.233604669570923, 2.3338441848754883, 2.434083938598633, 2.5343234539031982, 2.6345629692077637, 2.734802722930908, 2.8350422382354736, 2.935281753540039, 3.0355215072631836, 3.135761022567749, 3.2360005378723145, 3.336240291595459, 3.4364798069000244, 3.53671932220459, 3.6369590759277344, 3.7371985912323, 3.8374383449554443, 3.9376778602600098, 4.037917613983154, 4.138156890869141, 4.238396644592285, 4.33863639831543, 4.438876152038574, 4.539115905761719, 4.639355182647705, 4.73959493637085, 4.839834690093994, 4.9400739669799805, 5.040313720703125, 5.1405534744262695, 5.240792751312256]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 9.0, 7.0, 15.0, 9.0, 18.0, 18.0, 21.0, 25.0, 28.0, 31.0, 39.0, 38.0, 45.0, 52.0, 43.0, 46.0, 43.0, 54.0, 48.0, 46.0, 49.0, 38.0, 40.0, 27.0, 37.0, 29.0, 26.0, 12.0, 17.0, 14.0, 18.0, 10.0, 13.0, 12.0, 9.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3225250244140625, -1.2798298597335815, -1.2371348142623901, -1.1944396495819092, -1.1517446041107178, -1.1090494394302368, -1.0663542747497559, -1.0236592292785645, -0.9809641242027283, -0.9382690191268921, -0.8955739140510559, -0.8528788089752197, -0.8101836442947388, -0.7674885988235474, -0.7247934341430664, -0.6820983290672302, -0.639403223991394, -0.5967081189155579, -0.5540130138397217, -0.5113178491592407, -0.46862277388572693, -0.42592766880989075, -0.3832325339317322, -0.340537428855896, -0.2978423237800598, -0.25514721870422363, -0.21245209872722626, -0.16975697875022888, -0.1270618736743927, -0.08436676859855652, -0.04167163372039795, 0.0010234713554382324, 0.04371845722198486, 0.08641356974840164, 0.12910868227481842, 0.1718038022518158, 0.21449890732765198, 0.25719401240348816, 0.29988914728164673, 0.3425842523574829, 0.3852793574333191, 0.4279744625091553, 0.47066956758499146, 0.5133646726608276, 0.5560598373413086, 0.5987548828125, 0.641450047492981, 0.6841451525688171, 0.7268402576446533, 0.7695353627204895, 0.8122304677963257, 0.8549256324768066, 0.897620677947998, 0.940315842628479, 0.9830109477043152, 1.0257060527801514, 1.0684010982513428, 1.1110962629318237, 1.1537913084030151, 1.196486473083496, 1.2391815185546875, 1.2818766832351685, 1.3245718479156494, 1.3672668933868408, 1.4099620580673218]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 4.0, 5.0, 4.0, 12.0, 10.0, 19.0, 27.0, 30.0, 61.0, 121.0, 168.0, 427.0, 1306.0, 6014.0, 152301.0, 4017299.0, 13313.0, 2066.0, 586.0, 240.0, 116.0, 53.0, 32.0, 27.0, 14.0, 12.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0947265625, -1.067474365234375, -1.04022216796875, -1.012969970703125, -0.9857177734375, -0.958465576171875, -0.93121337890625, -0.903961181640625, -0.876708984375, -0.849456787109375, -0.82220458984375, -0.794952392578125, -0.7677001953125, -0.740447998046875, -0.71319580078125, -0.685943603515625, -0.65869140625, -0.631439208984375, -0.60418701171875, -0.576934814453125, -0.5496826171875, -0.522430419921875, -0.49517822265625, -0.467926025390625, -0.440673828125, -0.413421630859375, -0.38616943359375, -0.358917236328125, -0.3316650390625, -0.304412841796875, -0.27716064453125, -0.249908447265625, -0.22265625, -0.195404052734375, -0.16815185546875, -0.140899658203125, -0.1136474609375, -0.086395263671875, -0.05914306640625, -0.031890869140625, -0.004638671875, 0.022613525390625, 0.04986572265625, 0.077117919921875, 0.1043701171875, 0.131622314453125, 0.15887451171875, 0.186126708984375, 0.21337890625, 0.240631103515625, 0.26788330078125, 0.295135498046875, 0.3223876953125, 0.349639892578125, 0.37689208984375, 0.404144287109375, 0.431396484375, 0.458648681640625, 0.48590087890625, 0.513153076171875, 0.5404052734375, 0.567657470703125, 0.59490966796875, 0.622161865234375, 0.6494140625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 13.0, 11.0, 11.0, 16.0, 19.0, 22.0, 35.0, 26.0, 43.0, 56.0, 51.0, 60.0, 59.0, 55.0, 78.0, 60.0, 55.0, 53.0, 46.0, 42.0, 46.0, 27.0, 35.0, 19.0, 16.0, 12.0, 13.0, 2.0, 10.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08319091796875, -0.08060169219970703, -0.07801246643066406, -0.0754232406616211, -0.07283401489257812, -0.07024478912353516, -0.06765556335449219, -0.06506633758544922, -0.06247711181640625, -0.05988788604736328, -0.05729866027832031, -0.054709434509277344, -0.052120208740234375, -0.049530982971191406, -0.04694175720214844, -0.04435253143310547, -0.0417633056640625, -0.03917407989501953, -0.03658485412597656, -0.033995628356933594, -0.031406402587890625, -0.028817176818847656, -0.026227951049804688, -0.02363872528076172, -0.02104949951171875, -0.01846027374267578, -0.015871047973632812, -0.013281822204589844, -0.010692596435546875, -0.008103370666503906, -0.0055141448974609375, -0.0029249191284179688, -0.000335693359375, 0.0022535324096679688, 0.0048427581787109375, 0.007431983947753906, 0.010021209716796875, 0.012610435485839844, 0.015199661254882812, 0.01778888702392578, 0.02037811279296875, 0.02296733856201172, 0.025556564331054688, 0.028145790100097656, 0.030735015869140625, 0.033324241638183594, 0.03591346740722656, 0.03850269317626953, 0.0410919189453125, 0.04368114471435547, 0.04627037048339844, 0.048859596252441406, 0.051448822021484375, 0.054038047790527344, 0.05662727355957031, 0.05921649932861328, 0.06180572509765625, 0.06439495086669922, 0.06698417663574219, 0.06957340240478516, 0.07216262817382812, 0.0747518539428711, 0.07734107971191406, 0.07993030548095703, 0.08251953125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 3.0, 6.0, 11.0, 23.0, 24.0, 43.0, 52.0, 81.0, 109.0, 137.0, 308.0, 437.0, 757.0, 1605.0, 3371.0, 9289.0, 43585.0, 3955828.0, 152977.0, 15776.0, 5126.0, 2091.0, 1021.0, 650.0, 352.0, 218.0, 144.0, 80.0, 54.0, 36.0, 24.0, 12.0, 21.0, 14.0, 7.0, 4.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.701171875, -0.6830596923828125, -0.664947509765625, -0.6468353271484375, -0.62872314453125, -0.6106109619140625, -0.592498779296875, -0.5743865966796875, -0.5562744140625, -0.5381622314453125, -0.520050048828125, -0.5019378662109375, -0.48382568359375, -0.4657135009765625, -0.447601318359375, -0.4294891357421875, -0.411376953125, -0.3932647705078125, -0.375152587890625, -0.3570404052734375, -0.33892822265625, -0.3208160400390625, -0.302703857421875, -0.2845916748046875, -0.2664794921875, -0.2483673095703125, -0.230255126953125, -0.2121429443359375, -0.19403076171875, -0.1759185791015625, -0.157806396484375, -0.1396942138671875, -0.12158203125, -0.1034698486328125, -0.085357666015625, -0.0672454833984375, -0.04913330078125, -0.0310211181640625, -0.012908935546875, 0.0052032470703125, 0.0233154296875, 0.0414276123046875, 0.059539794921875, 0.0776519775390625, 0.09576416015625, 0.1138763427734375, 0.131988525390625, 0.1501007080078125, 0.168212890625, 0.1863250732421875, 0.204437255859375, 0.2225494384765625, 0.24066162109375, 0.2587738037109375, 0.276885986328125, 0.2949981689453125, 0.3131103515625, 0.3312225341796875, 0.349334716796875, 0.3674468994140625, 0.38555908203125, 0.4036712646484375, 0.421783447265625, 0.4398956298828125, 0.4580078125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 12.0, 13.0, 17.0, 59.0, 84.0, 236.0, 2491.0, 813.0, 159.0, 62.0, 29.0, 20.0, 12.0, 12.0, 8.0, 8.0, 5.0, 6.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.26904296875, -0.262451171875, -0.255859375, -0.249267578125, -0.24267578125, -0.236083984375, -0.2294921875, -0.222900390625, -0.21630859375, -0.209716796875, -0.203125, -0.196533203125, -0.18994140625, -0.183349609375, -0.1767578125, -0.170166015625, -0.16357421875, -0.156982421875, -0.150390625, -0.143798828125, -0.13720703125, -0.130615234375, -0.1240234375, -0.117431640625, -0.11083984375, -0.104248046875, -0.09765625, -0.091064453125, -0.08447265625, -0.077880859375, -0.0712890625, -0.064697265625, -0.05810546875, -0.051513671875, -0.044921875, -0.038330078125, -0.03173828125, -0.025146484375, -0.0185546875, -0.011962890625, -0.00537109375, 0.001220703125, 0.0078125, 0.014404296875, 0.02099609375, 0.027587890625, 0.0341796875, 0.040771484375, 0.04736328125, 0.053955078125, 0.060546875, 0.067138671875, 0.07373046875, 0.080322265625, 0.0869140625, 0.093505859375, 0.10009765625, 0.106689453125, 0.11328125, 0.119873046875, 0.12646484375, 0.133056640625, 0.1396484375, 0.146240234375, 0.15283203125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 14.0, 20.0, 172.0, 498.0, 226.0, 59.0, 21.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.034205675125122, -2.931492805480957, -2.828780174255371, -2.726067304611206, -2.62335467338562, -2.520641803741455, -2.417929172515869, -2.315216302871704, -2.212503433227539, -2.109790563583374, -2.007077932357788, -1.904365062713623, -1.801652431488037, -1.698939561843872, -1.5962268114089966, -1.493514060974121, -1.3908014297485352, -1.2880886793136597, -1.1853759288787842, -1.0826630592346191, -0.9799503684043884, -0.8772376179695129, -0.7745248079299927, -0.6718120574951172, -0.5690993070602417, -0.4663865566253662, -0.36367377638816833, -0.26096099615097046, -0.15824824571609497, -0.05553549528121948, 0.04717731475830078, 0.14989006519317627, 0.25260257720947266, 0.35531532764434814, 0.458028107881546, 0.5607408881187439, 0.6634536385536194, 0.7661663889884949, 0.8688791990280151, 0.9715919494628906, 1.0743046998977661, 1.1770174503326416, 1.279730200767517, 1.3824429512023926, 1.4851558208465576, 1.5878684520721436, 1.6905813217163086, 1.793294072151184, 1.8960068225860596, 1.998719573020935, 2.1014323234558105, 2.2041451930999756, 2.3068578243255615, 2.4095706939697266, 2.5122833251953125, 2.6149961948394775, 2.7177090644836426, 2.8204219341278076, 2.9231345653533936, 3.0258474349975586, 3.1285600662231445, 3.2312729358673096, 3.3339858055114746, 3.4366984367370605, 3.5394110679626465]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 8.0, 11.0, 13.0, 33.0, 29.0, 37.0, 42.0, 48.0, 72.0, 68.0, 73.0, 82.0, 87.0, 86.0, 63.0, 58.0, 55.0, 41.0, 29.0, 19.0, 17.0, 12.0, 9.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8488069176673889, -0.8235843181610107, -0.7983616590499878, -0.7731390595436096, -0.7479164004325867, -0.7226938009262085, -0.6974711418151855, -0.6722485423088074, -0.6470259428024292, -0.621803343296051, -0.5965806841850281, -0.5713580846786499, -0.546135425567627, -0.5209128260612488, -0.4956901967525482, -0.47046756744384766, -0.4452449083328247, -0.42002227902412415, -0.3947996497154236, -0.3695770502090454, -0.34435439109802246, -0.3191317915916443, -0.2939091622829437, -0.26868653297424316, -0.2434639036655426, -0.21824127435684204, -0.19301864504814148, -0.1677960306406021, -0.14257340133190155, -0.11735077202320099, -0.09212815761566162, -0.06690552830696106, -0.04168295860290527, -0.01646033301949501, 0.008762292563915253, 0.03398491442203522, 0.05920754373073578, 0.08443017303943634, 0.10965278744697571, 0.13487541675567627, 0.16009804606437683, 0.1853206753730774, 0.21054330468177795, 0.23576591908931732, 0.2609885334968567, 0.28621119260787964, 0.3114337921142578, 0.3366564214229584, 0.36187905073165894, 0.3871016800403595, 0.41232430934906006, 0.43754690885543823, 0.4627695679664612, 0.48799216747283936, 0.5132148265838623, 0.5384374260902405, 0.5636600255966187, 0.5888826251029968, 0.6141052842140198, 0.639327883720398, 0.6645505428314209, 0.6897731423377991, 0.7149957418441772, 0.7402184009552002, 0.7654410600662231]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 3.0, 11.0, 9.0, 9.0, 25.0, 38.0, 34.0, 42.0, 75.0, 109.0, 213.0, 363.0, 591.0, 1340.0, 3338.0, 11255.0, 49129.0, 290181.0, 544385.0, 115295.0, 22049.0, 5950.0, 2010.0, 887.0, 459.0, 255.0, 170.0, 110.0, 58.0, 27.0, 28.0, 19.0, 21.0, 13.0, 7.0, 12.0, 7.0, 5.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.356689453125, -0.3465690612792969, -0.33644866943359375, -0.3263282775878906, -0.3162078857421875, -0.3060874938964844, -0.29596710205078125, -0.2858467102050781, -0.275726318359375, -0.2656059265136719, -0.25548553466796875, -0.24536514282226562, -0.2352447509765625, -0.22512435913085938, -0.21500396728515625, -0.20488357543945312, -0.19476318359375, -0.18464279174804688, -0.17452239990234375, -0.16440200805664062, -0.1542816162109375, -0.14416122436523438, -0.13404083251953125, -0.12392044067382812, -0.113800048828125, -0.10367965698242188, -0.09355926513671875, -0.08343887329101562, -0.0733184814453125, -0.06319808959960938, -0.05307769775390625, -0.042957305908203125, -0.0328369140625, -0.022716522216796875, -0.01259613037109375, -0.002475738525390625, 0.0076446533203125, 0.017765045166015625, 0.02788543701171875, 0.038005828857421875, 0.048126220703125, 0.058246612548828125, 0.06836700439453125, 0.07848739624023438, 0.0886077880859375, 0.09872817993164062, 0.10884857177734375, 0.11896896362304688, 0.12908935546875, 0.13920974731445312, 0.14933013916015625, 0.15945053100585938, 0.1695709228515625, 0.17969131469726562, 0.18981170654296875, 0.19993209838867188, 0.210052490234375, 0.22017288208007812, 0.23029327392578125, 0.24041366577148438, 0.2505340576171875, 0.2606544494628906, 0.27077484130859375, 0.2808952331542969, 0.291015625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 0.0, 7.0, 12.0, 9.0, 14.0, 14.0, 20.0, 26.0, 27.0, 36.0, 46.0, 49.0, 48.0, 51.0, 52.0, 72.0, 58.0, 60.0, 69.0, 56.0, 41.0, 38.0, 33.0, 37.0, 28.0, 26.0, 19.0, 14.0, 12.0, 12.0, 8.0, 3.0, 3.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09100341796875, -0.08826446533203125, -0.0855255126953125, -0.08278656005859375, -0.080047607421875, -0.07730865478515625, -0.0745697021484375, -0.07183074951171875, -0.069091796875, -0.06635284423828125, -0.0636138916015625, -0.06087493896484375, -0.058135986328125, -0.05539703369140625, -0.0526580810546875, -0.04991912841796875, -0.04718017578125, -0.04444122314453125, -0.0417022705078125, -0.03896331787109375, -0.036224365234375, -0.03348541259765625, -0.0307464599609375, -0.02800750732421875, -0.0252685546875, -0.02252960205078125, -0.0197906494140625, -0.01705169677734375, -0.014312744140625, -0.01157379150390625, -0.0088348388671875, -0.00609588623046875, -0.00335693359375, -0.00061798095703125, 0.0021209716796875, 0.00485992431640625, 0.007598876953125, 0.01033782958984375, 0.0130767822265625, 0.01581573486328125, 0.0185546875, 0.02129364013671875, 0.0240325927734375, 0.02677154541015625, 0.029510498046875, 0.03224945068359375, 0.0349884033203125, 0.03772735595703125, 0.04046630859375, 0.04320526123046875, 0.0459442138671875, 0.04868316650390625, 0.051422119140625, 0.05416107177734375, 0.0569000244140625, 0.05963897705078125, 0.0623779296875, 0.06511688232421875, 0.0678558349609375, 0.07059478759765625, 0.073333740234375, 0.07607269287109375, 0.0788116455078125, 0.08155059814453125, 0.08428955078125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 15.0, 14.0, 17.0, 18.0, 24.0, 29.0, 44.0, 73.0, 73.0, 92.0, 186.0, 265.0, 437.0, 1119.0, 3064.0, 10153.0, 41262.0, 210457.0, 578007.0, 157716.0, 32428.0, 8353.0, 2545.0, 909.0, 456.0, 252.0, 152.0, 100.0, 71.0, 54.0, 32.0, 35.0, 23.0, 17.0, 14.0, 7.0, 8.0, 5.0, 6.0, 7.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.258056640625, -0.25055885314941406, -0.24306106567382812, -0.2355632781982422, -0.22806549072265625, -0.2205677032470703, -0.21306991577148438, -0.20557212829589844, -0.1980743408203125, -0.19057655334472656, -0.18307876586914062, -0.1755809783935547, -0.16808319091796875, -0.1605854034423828, -0.15308761596679688, -0.14558982849121094, -0.138092041015625, -0.13059425354003906, -0.12309646606445312, -0.11559867858886719, -0.10810089111328125, -0.10060310363769531, -0.09310531616210938, -0.08560752868652344, -0.0781097412109375, -0.07061195373535156, -0.06311416625976562, -0.05561637878417969, -0.04811859130859375, -0.04062080383300781, -0.033123016357421875, -0.025625228881835938, -0.01812744140625, -0.010629653930664062, -0.003131866455078125, 0.0043659210205078125, 0.01186370849609375, 0.019361495971679688, 0.026859283447265625, 0.03435707092285156, 0.0418548583984375, 0.04935264587402344, 0.056850433349609375, 0.06434822082519531, 0.07184600830078125, 0.07934379577636719, 0.08684158325195312, 0.09433937072753906, 0.101837158203125, 0.10933494567871094, 0.11683273315429688, 0.12433052062988281, 0.13182830810546875, 0.1393260955810547, 0.14682388305664062, 0.15432167053222656, 0.1618194580078125, 0.16931724548339844, 0.17681503295898438, 0.1843128204345703, 0.19181060791015625, 0.1993083953857422, 0.20680618286132812, 0.21430397033691406, 0.2218017578125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 1.0, 4.0, 0.0, 3.0, 11.0, 5.0, 8.0, 12.0, 7.0, 12.0, 16.0, 25.0, 15.0, 18.0, 26.0, 32.0, 31.0, 31.0, 43.0, 39.0, 41.0, 42.0, 45.0, 61.0, 39.0, 36.0, 42.0, 32.0, 41.0, 37.0, 23.0, 31.0, 24.0, 27.0, 30.0, 20.0, 16.0, 11.0, 14.0, 10.0, 8.0, 12.0, 5.0, 4.0, 3.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.250732421875, -0.24248123168945312, -0.23423004150390625, -0.22597885131835938, -0.2177276611328125, -0.20947647094726562, -0.20122528076171875, -0.19297409057617188, -0.184722900390625, -0.17647171020507812, -0.16822052001953125, -0.15996932983398438, -0.1517181396484375, -0.14346694946289062, -0.13521575927734375, -0.12696456909179688, -0.11871337890625, -0.11046218872070312, -0.10221099853515625, -0.09395980834960938, -0.0857086181640625, -0.07745742797851562, -0.06920623779296875, -0.060955047607421875, -0.052703857421875, -0.044452667236328125, -0.03620147705078125, -0.027950286865234375, -0.0196990966796875, -0.011447906494140625, -0.00319671630859375, 0.005054473876953125, 0.0133056640625, 0.021556854248046875, 0.02980804443359375, 0.038059234619140625, 0.0463104248046875, 0.054561614990234375, 0.06281280517578125, 0.07106399536132812, 0.079315185546875, 0.08756637573242188, 0.09581756591796875, 0.10406875610351562, 0.1123199462890625, 0.12057113647460938, 0.12882232666015625, 0.13707351684570312, 0.14532470703125, 0.15357589721679688, 0.16182708740234375, 0.17007827758789062, 0.1783294677734375, 0.18658065795898438, 0.19483184814453125, 0.20308303833007812, 0.211334228515625, 0.21958541870117188, 0.22783660888671875, 0.23608779907226562, 0.2443389892578125, 0.2525901794433594, 0.26084136962890625, 0.2690925598144531, 0.27734375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 3.0, 6.0, 5.0, 11.0, 14.0, 29.0, 31.0, 31.0, 78.0, 117.0, 151.0, 267.0, 377.0, 643.0, 1063.0, 1799.0, 3432.0, 7360.0, 17197.0, 51556.0, 244691.0, 538680.0, 124726.0, 32486.0, 12032.0, 5322.0, 2623.0, 1430.0, 873.0, 520.0, 341.0, 211.0, 137.0, 101.0, 62.0, 43.0, 28.0, 22.0, 19.0, 12.0, 6.0, 10.0, 4.0, 2.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.10595703125, -0.10295581817626953, -0.09995460510253906, -0.0969533920288086, -0.09395217895507812, -0.09095096588134766, -0.08794975280761719, -0.08494853973388672, -0.08194732666015625, -0.07894611358642578, -0.07594490051269531, -0.07294368743896484, -0.06994247436523438, -0.0669412612915039, -0.06394004821777344, -0.06093883514404297, -0.0579376220703125, -0.05493640899658203, -0.05193519592285156, -0.048933982849121094, -0.045932769775390625, -0.042931556701660156, -0.03993034362792969, -0.03692913055419922, -0.03392791748046875, -0.03092670440673828, -0.027925491333007812, -0.024924278259277344, -0.021923065185546875, -0.018921852111816406, -0.015920639038085938, -0.012919425964355469, -0.009918212890625, -0.006916999816894531, -0.0039157867431640625, -0.0009145736694335938, 0.002086639404296875, 0.005087852478027344, 0.008089065551757812, 0.011090278625488281, 0.01409149169921875, 0.01709270477294922, 0.020093917846679688, 0.023095130920410156, 0.026096343994140625, 0.029097557067871094, 0.03209877014160156, 0.03509998321533203, 0.0381011962890625, 0.04110240936279297, 0.04410362243652344, 0.047104835510253906, 0.050106048583984375, 0.053107261657714844, 0.05610847473144531, 0.05910968780517578, 0.06211090087890625, 0.06511211395263672, 0.06811332702636719, 0.07111454010009766, 0.07411575317382812, 0.0771169662475586, 0.08011817932128906, 0.08311939239501953, 0.08612060546875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 4.0, 10.0, 17.0, 15.0, 32.0, 55.0, 63.0, 134.0, 155.0, 167.0, 114.0, 84.0, 64.0, 31.0, 19.0, 14.0, 8.0, 12.0, 4.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.552436828613281e-05, -3.437977284193039e-05, -3.3235177397727966e-05, -3.209058195352554e-05, -3.094598650932312e-05, -2.9801391065120697e-05, -2.8656795620918274e-05, -2.751220017671585e-05, -2.6367604732513428e-05, -2.5223009288311005e-05, -2.407841384410858e-05, -2.293381839990616e-05, -2.1789222955703735e-05, -2.0644627511501312e-05, -1.950003206729889e-05, -1.8355436623096466e-05, -1.7210841178894043e-05, -1.606624573469162e-05, -1.4921650290489197e-05, -1.3777054846286774e-05, -1.263245940208435e-05, -1.1487863957881927e-05, -1.0343268513679504e-05, -9.198673069477081e-06, -8.054077625274658e-06, -6.909482181072235e-06, -5.764886736869812e-06, -4.620291292667389e-06, -3.475695848464966e-06, -2.3311004042625427e-06, -1.1865049600601196e-06, -4.190951585769653e-08, 1.1026859283447266e-06, 2.2472813725471497e-06, 3.3918768167495728e-06, 4.536472260951996e-06, 5.681067705154419e-06, 6.825663149356842e-06, 7.970258593559265e-06, 9.114854037761688e-06, 1.0259449481964111e-05, 1.1404044926166534e-05, 1.2548640370368958e-05, 1.369323581457138e-05, 1.4837831258773804e-05, 1.5982426702976227e-05, 1.712702214717865e-05, 1.8271617591381073e-05, 1.9416213035583496e-05, 2.056080847978592e-05, 2.1705403923988342e-05, 2.2849999368190765e-05, 2.399459481239319e-05, 2.513919025659561e-05, 2.6283785700798035e-05, 2.7428381145000458e-05, 2.857297658920288e-05, 2.9717572033405304e-05, 3.086216747760773e-05, 3.200676292181015e-05, 3.315135836601257e-05, 3.4295953810214996e-05, 3.544054925441742e-05, 3.658514469861984e-05, 3.7729740142822266e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 19.0, 22.0, 36.0, 38.0, 89.0, 125.0, 139.0, 274.0, 462.0, 915.0, 1740.0, 3760.0, 9538.0, 30020.0, 129772.0, 552407.0, 245828.0, 48920.0, 14202.0, 5287.0, 2221.0, 1152.0, 622.0, 383.0, 225.0, 123.0, 67.0, 49.0, 32.0, 24.0, 22.0, 14.0, 7.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.108154296875, -0.1046295166015625, -0.101104736328125, -0.0975799560546875, -0.09405517578125, -0.0905303955078125, -0.087005615234375, -0.0834808349609375, -0.0799560546875, -0.0764312744140625, -0.072906494140625, -0.0693817138671875, -0.06585693359375, -0.0623321533203125, -0.058807373046875, -0.0552825927734375, -0.0517578125, -0.0482330322265625, -0.044708251953125, -0.0411834716796875, -0.03765869140625, -0.0341339111328125, -0.030609130859375, -0.0270843505859375, -0.0235595703125, -0.0200347900390625, -0.016510009765625, -0.0129852294921875, -0.00946044921875, -0.0059356689453125, -0.002410888671875, 0.0011138916015625, 0.004638671875, 0.0081634521484375, 0.011688232421875, 0.0152130126953125, 0.01873779296875, 0.0222625732421875, 0.025787353515625, 0.0293121337890625, 0.0328369140625, 0.0363616943359375, 0.039886474609375, 0.0434112548828125, 0.04693603515625, 0.0504608154296875, 0.053985595703125, 0.0575103759765625, 0.06103515625, 0.0645599365234375, 0.068084716796875, 0.0716094970703125, 0.07513427734375, 0.0786590576171875, 0.082183837890625, 0.0857086181640625, 0.0892333984375, 0.0927581787109375, 0.096282958984375, 0.0998077392578125, 0.10333251953125, 0.1068572998046875, 0.110382080078125, 0.1139068603515625, 0.117431640625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 5.0, 3.0, 1.0, 9.0, 5.0, 11.0, 9.0, 12.0, 22.0, 16.0, 16.0, 37.0, 39.0, 56.0, 51.0, 54.0, 68.0, 63.0, 79.0, 56.0, 68.0, 71.0, 49.0, 42.0, 24.0, 29.0, 24.0, 14.0, 14.0, 10.0, 7.0, 6.0, 13.0, 5.0, 3.0, 3.0, 0.0, 3.0, 1.0, 6.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.0960693359375, -0.09334659576416016, -0.09062385559082031, -0.08790111541748047, -0.08517837524414062, -0.08245563507080078, -0.07973289489746094, -0.0770101547241211, -0.07428741455078125, -0.0715646743774414, -0.06884193420410156, -0.06611919403076172, -0.06339645385742188, -0.06067371368408203, -0.05795097351074219, -0.055228233337402344, -0.0525054931640625, -0.049782752990722656, -0.04706001281738281, -0.04433727264404297, -0.041614532470703125, -0.03889179229736328, -0.03616905212402344, -0.033446311950683594, -0.03072357177734375, -0.028000831604003906, -0.025278091430664062, -0.02255535125732422, -0.019832611083984375, -0.01710987091064453, -0.014387130737304688, -0.011664390563964844, -0.008941650390625, -0.006218910217285156, -0.0034961700439453125, -0.0007734298706054688, 0.001949310302734375, 0.004672050476074219, 0.0073947906494140625, 0.010117530822753906, 0.01284027099609375, 0.015563011169433594, 0.018285751342773438, 0.02100849151611328, 0.023731231689453125, 0.02645397186279297, 0.029176712036132812, 0.031899452209472656, 0.0346221923828125, 0.037344932556152344, 0.04006767272949219, 0.04279041290283203, 0.045513153076171875, 0.04823589324951172, 0.05095863342285156, 0.053681373596191406, 0.05640411376953125, 0.059126853942871094, 0.06184959411621094, 0.06457233428955078, 0.06729507446289062, 0.07001781463623047, 0.07274055480957031, 0.07546329498291016, 0.07818603515625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 21.0, 34.0, 58.0, 112.0, 184.0, 181.0, 155.0, 105.0, 60.0, 44.0, 20.0, 9.0, 10.0, 2.0, 3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.185805320739746, -2.114001512527466, -2.0421977043151855, -1.9703940153121948, -1.8985902070999146, -1.8267865180969238, -1.7549827098846436, -1.6831789016723633, -1.611375093460083, -1.5395712852478027, -1.467767596244812, -1.3959637880325317, -1.3241599798202515, -1.2523562908172607, -1.1805524826049805, -1.1087486743927002, -1.0369449853897095, -0.965141236782074, -0.8933374285697937, -0.8215336799621582, -0.7497298717498779, -0.6779261231422424, -0.6061223745346069, -0.5343185663223267, -0.46251481771469116, -0.3907110393047333, -0.3189072608947754, -0.2471035122871399, -0.175299733877182, -0.10349595546722412, -0.03169220685958862, 0.04011160135269165, 0.11191534996032715, 0.18371912837028503, 0.2555229067802429, 0.3273266553878784, 0.3991304337978363, 0.4709342122077942, 0.5427379608154297, 0.61454176902771, 0.6863455176353455, 0.758149266242981, 0.8299530744552612, 0.9017568230628967, 0.9735605716705322, 1.0453643798828125, 1.1171681880950928, 1.188971996307373, 1.2607756853103638, 1.332579493522644, 1.4043831825256348, 1.476186990737915, 1.5479907989501953, 1.6197946071624756, 1.6915982961654663, 1.7634021043777466, 1.8352057933807373, 1.9070096015930176, 1.9788132905960083, 2.050617218017578, 2.1224207878112793, 2.1942245960235596, 2.26602840423584, 2.33783221244812, 2.4096360206604004]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 6.0, 5.0, 5.0, 6.0, 5.0, 11.0, 9.0, 10.0, 16.0, 17.0, 19.0, 21.0, 23.0, 21.0, 29.0, 23.0, 28.0, 25.0, 37.0, 34.0, 36.0, 49.0, 31.0, 38.0, 24.0, 34.0, 36.0, 39.0, 34.0, 32.0, 27.0, 29.0, 28.0, 33.0, 26.0, 25.0, 20.0, 16.0, 13.0, 21.0, 14.0, 8.0, 10.0, 9.0, 11.0, 6.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.2216308116912842, -1.1852636337280273, -1.1488964557647705, -1.1125292778015137, -1.0761620998382568, -1.039794921875, -1.0034277439117432, -0.9670606255531311, -0.9306934475898743, -0.8943262696266174, -0.8579590916633606, -0.8215919137001038, -0.7852247953414917, -0.7488576173782349, -0.712490439414978, -0.6761232614517212, -0.6397560834884644, -0.6033889055252075, -0.5670217275619507, -0.5306545495986938, -0.4942874014377594, -0.45792022347450256, -0.4215530753135681, -0.3851858973503113, -0.34881871938705444, -0.3124515414237976, -0.27608436346054077, -0.23971721529960632, -0.2033500373363495, -0.16698285937309265, -0.130615696310997, -0.09424853324890137, -0.05788135528564453, -0.021514184772968292, 0.014852985739707947, 0.051220156252384186, 0.08758732676506042, 0.12395450472831726, 0.1603216677904129, 0.19668883085250854, 0.23305600881576538, 0.2694231867790222, 0.30579036474227905, 0.3421575129032135, 0.37852469086647034, 0.4148918688297272, 0.4512590169906616, 0.48762619495391846, 0.5239933729171753, 0.5603605508804321, 0.596727728843689, 0.6330949068069458, 0.6694620847702026, 0.7058292627334595, 0.7421963810920715, 0.7785635590553284, 0.8149307370185852, 0.851297914981842, 0.8876650929450989, 0.9240322709083557, 0.9603993892669678, 0.9967665672302246, 1.0331337451934814, 1.0695009231567383, 1.1058681011199951]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 2.0, 4.0, 12.0, 20.0, 29.0, 40.0, 71.0, 106.0, 321.0, 3253.0, 4187343.0, 2501.0, 279.0, 139.0, 62.0, 37.0, 29.0, 14.0, 8.0, 5.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.208984375, -3.127655029296875, -3.04632568359375, -2.964996337890625, -2.8836669921875, -2.802337646484375, -2.72100830078125, -2.639678955078125, -2.558349609375, -2.477020263671875, -2.39569091796875, -2.314361572265625, -2.2330322265625, -2.151702880859375, -2.07037353515625, -1.989044189453125, -1.90771484375, -1.826385498046875, -1.74505615234375, -1.663726806640625, -1.5823974609375, -1.501068115234375, -1.41973876953125, -1.338409423828125, -1.257080078125, -1.175750732421875, -1.09442138671875, -1.013092041015625, -0.9317626953125, -0.850433349609375, -0.76910400390625, -0.687774658203125, -0.6064453125, -0.525115966796875, -0.44378662109375, -0.362457275390625, -0.2811279296875, -0.199798583984375, -0.11846923828125, -0.037139892578125, 0.044189453125, 0.125518798828125, 0.20684814453125, 0.288177490234375, 0.3695068359375, 0.450836181640625, 0.53216552734375, 0.613494873046875, 0.69482421875, 0.776153564453125, 0.85748291015625, 0.938812255859375, 1.0201416015625, 1.101470947265625, 1.18280029296875, 1.264129638671875, 1.345458984375, 1.426788330078125, 1.50811767578125, 1.589447021484375, 1.6707763671875, 1.752105712890625, 1.83343505859375, 1.914764404296875, 1.99609375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 1.0, 2.0, 1.0, 12.0, 3.0, 9.0, 12.0, 16.0, 9.0, 24.0, 21.0, 26.0, 26.0, 27.0, 46.0, 41.0, 47.0, 60.0, 46.0, 52.0, 50.0, 64.0, 57.0, 42.0, 35.0, 34.0, 38.0, 30.0, 32.0, 31.0, 22.0, 20.0, 13.0, 18.0, 15.0, 8.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.082763671875, -0.0802011489868164, -0.07763862609863281, -0.07507610321044922, -0.07251358032226562, -0.06995105743408203, -0.06738853454589844, -0.06482601165771484, -0.06226348876953125, -0.059700965881347656, -0.05713844299316406, -0.05457592010498047, -0.052013397216796875, -0.04945087432861328, -0.04688835144042969, -0.044325828552246094, -0.0417633056640625, -0.039200782775878906, -0.03663825988769531, -0.03407573699951172, -0.031513214111328125, -0.02895069122314453, -0.026388168334960938, -0.023825645446777344, -0.02126312255859375, -0.018700599670410156, -0.016138076782226562, -0.013575553894042969, -0.011013031005859375, -0.008450508117675781, -0.0058879852294921875, -0.0033254623413085938, -0.000762939453125, 0.0017995834350585938, 0.0043621063232421875, 0.006924629211425781, 0.009487152099609375, 0.012049674987792969, 0.014612197875976562, 0.017174720764160156, 0.01973724365234375, 0.022299766540527344, 0.024862289428710938, 0.02742481231689453, 0.029987335205078125, 0.03254985809326172, 0.03511238098144531, 0.037674903869628906, 0.0402374267578125, 0.042799949645996094, 0.04536247253417969, 0.04792499542236328, 0.050487518310546875, 0.05305004119873047, 0.05561256408691406, 0.058175086975097656, 0.06073760986328125, 0.06330013275146484, 0.06586265563964844, 0.06842517852783203, 0.07098770141601562, 0.07355022430419922, 0.07611274719238281, 0.0786752700805664, 0.08123779296875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 5.0, 14.0, 17.0, 12.0, 13.0, 34.0, 39.0, 37.0, 43.0, 60.0, 76.0, 118.0, 237.0, 401.0, 765.0, 1658.0, 4018.0, 22375.0, 4144672.0, 13075.0, 3333.0, 1458.0, 759.0, 390.0, 213.0, 111.0, 70.0, 54.0, 34.0, 28.0, 34.0, 22.0, 24.0, 19.0, 15.0, 14.0, 5.0, 7.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.7958984375, -0.7746200561523438, -0.7533416748046875, -0.7320632934570312, -0.710784912109375, -0.6895065307617188, -0.6682281494140625, -0.6469497680664062, -0.62567138671875, -0.6043930053710938, -0.5831146240234375, -0.5618362426757812, -0.540557861328125, -0.5192794799804688, -0.4980010986328125, -0.47672271728515625, -0.4554443359375, -0.43416595458984375, -0.4128875732421875, -0.39160919189453125, -0.370330810546875, -0.34905242919921875, -0.3277740478515625, -0.30649566650390625, -0.28521728515625, -0.26393890380859375, -0.2426605224609375, -0.22138214111328125, -0.200103759765625, -0.17882537841796875, -0.1575469970703125, -0.13626861572265625, -0.114990234375, -0.09371185302734375, -0.0724334716796875, -0.05115509033203125, -0.029876708984375, -0.00859832763671875, 0.0126800537109375, 0.03395843505859375, 0.05523681640625, 0.07651519775390625, 0.0977935791015625, 0.11907196044921875, 0.140350341796875, 0.16162872314453125, 0.1829071044921875, 0.20418548583984375, 0.2254638671875, 0.24674224853515625, 0.2680206298828125, 0.28929901123046875, 0.310577392578125, 0.33185577392578125, 0.3531341552734375, 0.37441253662109375, 0.39569091796875, 0.41696929931640625, 0.4382476806640625, 0.45952606201171875, 0.480804443359375, 0.5020828247070312, 0.5233612060546875, 0.5446395874023438, 0.56591796875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 6.0, 10.0, 57.0, 3723.0, 228.0, 28.0, 4.0, 7.0, 0.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.113525390625, -0.10912513732910156, -0.10472488403320312, -0.10032463073730469, -0.09592437744140625, -0.09152412414550781, -0.08712387084960938, -0.08272361755371094, -0.0783233642578125, -0.07392311096191406, -0.06952285766601562, -0.06512260437011719, -0.06072235107421875, -0.05632209777832031, -0.051921844482421875, -0.04752159118652344, -0.043121337890625, -0.03872108459472656, -0.034320831298828125, -0.029920578002929688, -0.02552032470703125, -0.021120071411132812, -0.016719818115234375, -0.012319564819335938, -0.0079193115234375, -0.0035190582275390625, 0.000881195068359375, 0.0052814483642578125, 0.00968170166015625, 0.014081954956054688, 0.018482208251953125, 0.022882461547851562, 0.02728271484375, 0.03168296813964844, 0.036083221435546875, 0.04048347473144531, 0.04488372802734375, 0.04928398132324219, 0.053684234619140625, 0.05808448791503906, 0.0624847412109375, 0.06688499450683594, 0.07128524780273438, 0.07568550109863281, 0.08008575439453125, 0.08448600769042969, 0.08888626098632812, 0.09328651428222656, 0.097686767578125, 0.10208702087402344, 0.10648727416992188, 0.11088752746582031, 0.11528778076171875, 0.11968803405761719, 0.12408828735351562, 0.12848854064941406, 0.1328887939453125, 0.13728904724121094, 0.14168930053710938, 0.1460895538330078, 0.15048980712890625, 0.1548900604248047, 0.15929031372070312, 0.16369056701660156, 0.1680908203125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 1.0, 5.0, 7.0, 20.0, 42.0, 156.0, 302.0, 245.0, 134.0, 63.0, 20.0, 10.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16086207330226898, -0.1400904804468155, -0.1193188726902008, -0.09854727983474731, -0.07777567952871323, -0.05700407922267914, -0.03623248636722565, -0.015460878610610962, 0.005310714244842529, 0.026082312688231468, 0.04685391113162041, 0.0676255077123642, 0.08839710801839828, 0.10916870832443237, 0.12994030117988586, 0.15071190893650055, 0.17148350179195404, 0.19225509464740753, 0.21302670240402222, 0.2337982952594757, 0.2545698881149292, 0.2753415107727051, 0.2961130738258362, 0.31688469648361206, 0.33765628933906555, 0.35842788219451904, 0.37919947504997253, 0.399971067905426, 0.4207426905632019, 0.4415142834186554, 0.4622858762741089, 0.48305749893188477, 0.5038290619850159, 0.5246006846427917, 0.5453722476959229, 0.5661438703536987, 0.5869154334068298, 0.6076870560646057, 0.6284586191177368, 0.6492302417755127, 0.6700018644332886, 0.6907734870910645, 0.7115450501441956, 0.7323166728019714, 0.7530882358551025, 0.7738598585128784, 0.7946314811706543, 0.8154030442237854, 0.8361746072769165, 0.8569462299346924, 0.8777177929878235, 0.8984894156455994, 0.9192609786987305, 0.9400326013565063, 0.9608042240142822, 0.9815757870674133, 1.002347469329834, 1.0231190919876099, 1.0438907146453857, 1.064662218093872, 1.085433840751648, 1.1062054634094238, 1.1269770860671997, 1.1477487087249756, 1.168520212173462]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 5.0, 8.0, 7.0, 6.0, 14.0, 7.0, 21.0, 11.0, 21.0, 18.0, 22.0, 32.0, 24.0, 32.0, 30.0, 25.0, 24.0, 37.0, 49.0, 35.0, 45.0, 30.0, 38.0, 28.0, 35.0, 36.0, 37.0, 24.0, 28.0, 40.0, 32.0, 29.0, 26.0, 25.0, 18.0, 12.0, 15.0, 10.0, 9.0, 7.0, 8.0, 6.0, 6.0, 7.0, 7.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1327114701271057, -0.12841123342514038, -0.12411098182201385, -0.11981074512004852, -0.1155105009675026, -0.11121025681495667, -0.10691002011299133, -0.1026097759604454, -0.09830953180789948, -0.09400928765535355, -0.08970904350280762, -0.08540880680084229, -0.08110856264829636, -0.07680831849575043, -0.0725080817937851, -0.06820783764123917, -0.06390759348869324, -0.05960734933614731, -0.05530710890889168, -0.05100686848163605, -0.04670662432909012, -0.04240638017654419, -0.03810613974928856, -0.03380589932203293, -0.029505655169487, -0.02520541287958622, -0.02090517058968544, -0.01660492829978466, -0.01230468600988388, -0.008004443719983101, -0.003704201430082321, 0.0005960408598184586, 0.004896283149719238, 0.009196525439620018, 0.013496767729520798, 0.017797010019421577, 0.022097252309322357, 0.026397494599223137, 0.030697736889123917, 0.03499797731637955, 0.039298221468925476, 0.043598465621471405, 0.047898706048727036, 0.052198946475982666, 0.056499190628528595, 0.060799434781074524, 0.06509967148303986, 0.06939991563558578, 0.07370015978813171, 0.07800040394067764, 0.08230064809322357, 0.0866008847951889, 0.09090112894773483, 0.09520137310028076, 0.0995016098022461, 0.10380185395479202, 0.10810209810733795, 0.11240234225988388, 0.11670258641242981, 0.12100282311439514, 0.12530305981636047, 0.129603311419487, 0.13390354812145233, 0.13820379972457886, 0.1425040364265442]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 5.0, 5.0, 13.0, 10.0, 24.0, 25.0, 41.0, 74.0, 88.0, 156.0, 293.0, 598.0, 1433.0, 4141.0, 13487.0, 52724.0, 233126.0, 503730.0, 180668.0, 41263.0, 10720.0, 3473.0, 1224.0, 516.0, 292.0, 158.0, 97.0, 49.0, 41.0, 28.0, 11.0, 10.0, 11.0, 6.0, 7.0, 3.0, 4.0, 1.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.226318359375, -0.21862411499023438, -0.21092987060546875, -0.20323562622070312, -0.1955413818359375, -0.18784713745117188, -0.18015289306640625, -0.17245864868164062, -0.164764404296875, -0.15707015991210938, -0.14937591552734375, -0.14168167114257812, -0.1339874267578125, -0.12629318237304688, -0.11859893798828125, -0.11090469360351562, -0.10321044921875, -0.09551620483398438, -0.08782196044921875, -0.08012771606445312, -0.0724334716796875, -0.06473922729492188, -0.05704498291015625, -0.049350738525390625, -0.041656494140625, -0.033962249755859375, -0.02626800537109375, -0.018573760986328125, -0.0108795166015625, -0.003185272216796875, 0.00450897216796875, 0.012203216552734375, 0.0198974609375, 0.027591705322265625, 0.03528594970703125, 0.042980194091796875, 0.0506744384765625, 0.058368682861328125, 0.06606292724609375, 0.07375717163085938, 0.081451416015625, 0.08914566040039062, 0.09683990478515625, 0.10453414916992188, 0.1122283935546875, 0.11992263793945312, 0.12761688232421875, 0.13531112670898438, 0.14300537109375, 0.15069961547851562, 0.15839385986328125, 0.16608810424804688, 0.1737823486328125, 0.18147659301757812, 0.18917083740234375, 0.19686508178710938, 0.204559326171875, 0.21225357055664062, 0.21994781494140625, 0.22764205932617188, 0.2353363037109375, 0.24303054809570312, 0.25072479248046875, 0.2584190368652344, 0.26611328125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 7.0, 7.0, 9.0, 13.0, 12.0, 13.0, 15.0, 20.0, 28.0, 26.0, 30.0, 26.0, 30.0, 49.0, 48.0, 42.0, 45.0, 57.0, 42.0, 40.0, 57.0, 51.0, 37.0, 54.0, 22.0, 28.0, 32.0, 29.0, 23.0, 10.0, 23.0, 17.0, 13.0, 17.0, 6.0, 6.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08172607421875, -0.07912349700927734, -0.07652091979980469, -0.07391834259033203, -0.07131576538085938, -0.06871318817138672, -0.06611061096191406, -0.0635080337524414, -0.06090545654296875, -0.058302879333496094, -0.05570030212402344, -0.05309772491455078, -0.050495147705078125, -0.04789257049560547, -0.04528999328613281, -0.042687416076660156, -0.0400848388671875, -0.037482261657714844, -0.03487968444824219, -0.03227710723876953, -0.029674530029296875, -0.02707195281982422, -0.024469375610351562, -0.021866798400878906, -0.01926422119140625, -0.016661643981933594, -0.014059066772460938, -0.011456489562988281, -0.008853912353515625, -0.006251335144042969, -0.0036487579345703125, -0.0010461807250976562, 0.001556396484375, 0.004158973693847656, 0.0067615509033203125, 0.009364128112792969, 0.011966705322265625, 0.014569282531738281, 0.017171859741210938, 0.019774436950683594, 0.02237701416015625, 0.024979591369628906, 0.027582168579101562, 0.03018474578857422, 0.032787322998046875, 0.03538990020751953, 0.03799247741699219, 0.040595054626464844, 0.0431976318359375, 0.045800209045410156, 0.04840278625488281, 0.05100536346435547, 0.053607940673828125, 0.05621051788330078, 0.05881309509277344, 0.061415672302246094, 0.06401824951171875, 0.0666208267211914, 0.06922340393066406, 0.07182598114013672, 0.07442855834960938, 0.07703113555908203, 0.07963371276855469, 0.08223628997802734, 0.0848388671875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 6.0, 9.0, 6.0, 10.0, 11.0, 16.0, 17.0, 31.0, 34.0, 44.0, 60.0, 87.0, 135.0, 235.0, 402.0, 898.0, 2814.0, 13502.0, 96934.0, 685053.0, 216064.0, 25023.0, 4625.0, 1230.0, 518.0, 275.0, 135.0, 120.0, 69.0, 52.0, 33.0, 32.0, 26.0, 14.0, 13.0, 13.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.297119140625, -0.2871055603027344, -0.27709197998046875, -0.2670783996582031, -0.2570648193359375, -0.24705123901367188, -0.23703765869140625, -0.22702407836914062, -0.217010498046875, -0.20699691772460938, -0.19698333740234375, -0.18696975708007812, -0.1769561767578125, -0.16694259643554688, -0.15692901611328125, -0.14691543579101562, -0.13690185546875, -0.12688827514648438, -0.11687469482421875, -0.10686111450195312, -0.0968475341796875, -0.08683395385742188, -0.07682037353515625, -0.06680679321289062, -0.056793212890625, -0.046779632568359375, -0.03676605224609375, -0.026752471923828125, -0.0167388916015625, -0.006725311279296875, 0.00328826904296875, 0.013301849365234375, 0.0233154296875, 0.033329010009765625, 0.04334259033203125, 0.053356170654296875, 0.0633697509765625, 0.07338333129882812, 0.08339691162109375, 0.09341049194335938, 0.103424072265625, 0.11343765258789062, 0.12345123291015625, 0.13346481323242188, 0.1434783935546875, 0.15349197387695312, 0.16350555419921875, 0.17351913452148438, 0.18353271484375, 0.19354629516601562, 0.20355987548828125, 0.21357345581054688, 0.2235870361328125, 0.23360061645507812, 0.24361419677734375, 0.2536277770996094, 0.263641357421875, 0.2736549377441406, 0.28366851806640625, 0.2936820983886719, 0.3036956787109375, 0.3137092590332031, 0.32372283935546875, 0.3337364196777344, 0.34375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 7.0, 3.0, 5.0, 11.0, 11.0, 13.0, 12.0, 12.0, 14.0, 17.0, 21.0, 24.0, 38.0, 32.0, 37.0, 53.0, 38.0, 56.0, 53.0, 47.0, 42.0, 38.0, 42.0, 46.0, 40.0, 45.0, 41.0, 33.0, 29.0, 20.0, 34.0, 16.0, 18.0, 14.0, 13.0, 11.0, 9.0, 8.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.294189453125, -0.2830467224121094, -0.27190399169921875, -0.2607612609863281, -0.2496185302734375, -0.23847579956054688, -0.22733306884765625, -0.21619033813476562, -0.205047607421875, -0.19390487670898438, -0.18276214599609375, -0.17161941528320312, -0.1604766845703125, -0.14933395385742188, -0.13819122314453125, -0.12704849243164062, -0.11590576171875, -0.10476303100585938, -0.09362030029296875, -0.08247756958007812, -0.0713348388671875, -0.060192108154296875, -0.04904937744140625, -0.037906646728515625, -0.026763916015625, -0.015621185302734375, -0.00447845458984375, 0.006664276123046875, 0.0178070068359375, 0.028949737548828125, 0.04009246826171875, 0.051235198974609375, 0.0623779296875, 0.07352066040039062, 0.08466339111328125, 0.09580612182617188, 0.1069488525390625, 0.11809158325195312, 0.12923431396484375, 0.14037704467773438, 0.151519775390625, 0.16266250610351562, 0.17380523681640625, 0.18494796752929688, 0.1960906982421875, 0.20723342895507812, 0.21837615966796875, 0.22951889038085938, 0.24066162109375, 0.2518043518066406, 0.26294708251953125, 0.2740898132324219, 0.2852325439453125, 0.2963752746582031, 0.30751800537109375, 0.3186607360839844, 0.329803466796875, 0.3409461975097656, 0.35208892822265625, 0.3632316589355469, 0.3743743896484375, 0.3855171203613281, 0.39665985107421875, 0.4078025817871094, 0.4189453125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 4.0, 4.0, 7.0, 16.0, 25.0, 35.0, 43.0, 55.0, 83.0, 167.0, 244.0, 440.0, 817.0, 1569.0, 3377.0, 8172.0, 23337.0, 83266.0, 420177.0, 391448.0, 78051.0, 22509.0, 8005.0, 3276.0, 1544.0, 791.0, 420.0, 242.0, 157.0, 86.0, 59.0, 41.0, 31.0, 19.0, 11.0, 7.0, 3.0, 4.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07562255859375, -0.07310009002685547, -0.07057762145996094, -0.0680551528930664, -0.06553268432617188, -0.06301021575927734, -0.06048774719238281, -0.05796527862548828, -0.05544281005859375, -0.05292034149169922, -0.05039787292480469, -0.047875404357910156, -0.045352935791015625, -0.042830467224121094, -0.04030799865722656, -0.03778553009033203, -0.0352630615234375, -0.03274059295654297, -0.030218124389648438, -0.027695655822753906, -0.025173187255859375, -0.022650718688964844, -0.020128250122070312, -0.01760578155517578, -0.01508331298828125, -0.012560844421386719, -0.010038375854492188, -0.007515907287597656, -0.004993438720703125, -0.0024709701538085938, 5.14984130859375e-05, 0.0025739669799804688, 0.005096435546875, 0.007618904113769531, 0.010141372680664062, 0.012663841247558594, 0.015186309814453125, 0.017708778381347656, 0.020231246948242188, 0.02275371551513672, 0.02527618408203125, 0.02779865264892578, 0.030321121215820312, 0.032843589782714844, 0.035366058349609375, 0.037888526916503906, 0.04041099548339844, 0.04293346405029297, 0.0454559326171875, 0.04797840118408203, 0.05050086975097656, 0.053023338317871094, 0.055545806884765625, 0.058068275451660156, 0.06059074401855469, 0.06311321258544922, 0.06563568115234375, 0.06815814971923828, 0.07068061828613281, 0.07320308685302734, 0.07572555541992188, 0.0782480239868164, 0.08077049255371094, 0.08329296112060547, 0.0858154296875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 6.0, 3.0, 2.0, 4.0, 8.0, 11.0, 11.0, 34.0, 52.0, 55.0, 113.0, 140.0, 134.0, 132.0, 87.0, 83.0, 39.0, 23.0, 20.0, 19.0, 7.0, 6.0, 4.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5928020477294922e-05, -2.502184361219406e-05, -2.41156667470932e-05, -2.320948988199234e-05, -2.230331301689148e-05, -2.139713615179062e-05, -2.0490959286689758e-05, -1.9584782421588898e-05, -1.8678605556488037e-05, -1.7772428691387177e-05, -1.6866251826286316e-05, -1.5960074961185455e-05, -1.5053898096084595e-05, -1.4147721230983734e-05, -1.3241544365882874e-05, -1.2335367500782013e-05, -1.1429190635681152e-05, -1.0523013770580292e-05, -9.616836905479431e-06, -8.71066004037857e-06, -7.80448317527771e-06, -6.898306310176849e-06, -5.992129445075989e-06, -5.085952579975128e-06, -4.179775714874268e-06, -3.273598849773407e-06, -2.3674219846725464e-06, -1.4612451195716858e-06, -5.550682544708252e-07, 3.511086106300354e-07, 1.257285475730896e-06, 2.1634623408317566e-06, 3.069639205932617e-06, 3.975816071033478e-06, 4.881992936134338e-06, 5.788169801235199e-06, 6.6943466663360596e-06, 7.60052353143692e-06, 8.50670039653778e-06, 9.412877261638641e-06, 1.0319054126739502e-05, 1.1225230991840363e-05, 1.2131407856941223e-05, 1.3037584722042084e-05, 1.3943761587142944e-05, 1.4849938452243805e-05, 1.5756115317344666e-05, 1.6662292182445526e-05, 1.7568469047546387e-05, 1.8474645912647247e-05, 1.9380822777748108e-05, 2.028699964284897e-05, 2.119317650794983e-05, 2.209935337305069e-05, 2.300553023815155e-05, 2.391170710325241e-05, 2.481788396835327e-05, 2.5724060833454132e-05, 2.6630237698554993e-05, 2.7536414563655853e-05, 2.8442591428756714e-05, 2.9348768293857574e-05, 3.0254945158958435e-05, 3.1161122024059296e-05, 3.2067298889160156e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 11.0, 8.0, 15.0, 20.0, 23.0, 50.0, 55.0, 117.0, 198.0, 354.0, 630.0, 1316.0, 3012.0, 7903.0, 23744.0, 89839.0, 411352.0, 388927.0, 85158.0, 22612.0, 7470.0, 2958.0, 1306.0, 643.0, 330.0, 192.0, 110.0, 53.0, 40.0, 26.0, 19.0, 16.0, 17.0, 7.0, 4.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.07977294921875, -0.07711219787597656, -0.07445144653320312, -0.07179069519042969, -0.06912994384765625, -0.06646919250488281, -0.06380844116210938, -0.06114768981933594, -0.0584869384765625, -0.05582618713378906, -0.053165435791015625, -0.05050468444824219, -0.04784393310546875, -0.04518318176269531, -0.042522430419921875, -0.03986167907714844, -0.037200927734375, -0.03454017639160156, -0.031879425048828125, -0.029218673706054688, -0.02655792236328125, -0.023897171020507812, -0.021236419677734375, -0.018575668334960938, -0.0159149169921875, -0.013254165649414062, -0.010593414306640625, -0.007932662963867188, -0.00527191162109375, -0.0026111602783203125, 4.9591064453125e-05, 0.0027103424072265625, 0.00537109375, 0.008031845092773438, 0.010692596435546875, 0.013353347778320312, 0.01601409912109375, 0.018674850463867188, 0.021335601806640625, 0.023996353149414062, 0.0266571044921875, 0.029317855834960938, 0.031978607177734375, 0.03463935852050781, 0.03730010986328125, 0.03996086120605469, 0.042621612548828125, 0.04528236389160156, 0.047943115234375, 0.05060386657714844, 0.053264617919921875, 0.05592536926269531, 0.05858612060546875, 0.06124687194824219, 0.06390762329101562, 0.06656837463378906, 0.0692291259765625, 0.07188987731933594, 0.07455062866210938, 0.07721138000488281, 0.07987213134765625, 0.08253288269042969, 0.08519363403320312, 0.08785438537597656, 0.09051513671875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 4.0, 6.0, 8.0, 7.0, 6.0, 5.0, 8.0, 17.0, 13.0, 22.0, 19.0, 34.0, 33.0, 45.0, 48.0, 54.0, 57.0, 62.0, 67.0, 68.0, 74.0, 58.0, 50.0, 46.0, 30.0, 30.0, 35.0, 15.0, 18.0, 20.0, 6.0, 10.0, 8.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.07562255859375, -0.07322120666503906, -0.07081985473632812, -0.06841850280761719, -0.06601715087890625, -0.06361579895019531, -0.061214447021484375, -0.05881309509277344, -0.0564117431640625, -0.05401039123535156, -0.051609039306640625, -0.04920768737792969, -0.04680633544921875, -0.04440498352050781, -0.042003631591796875, -0.03960227966308594, -0.037200927734375, -0.03479957580566406, -0.032398223876953125, -0.029996871948242188, -0.02759552001953125, -0.025194168090820312, -0.022792816162109375, -0.020391464233398438, -0.0179901123046875, -0.015588760375976562, -0.013187408447265625, -0.010786056518554688, -0.00838470458984375, -0.0059833526611328125, -0.003582000732421875, -0.0011806488037109375, 0.001220703125, 0.0036220550537109375, 0.006023406982421875, 0.008424758911132812, 0.01082611083984375, 0.013227462768554688, 0.015628814697265625, 0.018030166625976562, 0.0204315185546875, 0.022832870483398438, 0.025234222412109375, 0.027635574340820312, 0.03003692626953125, 0.03243827819824219, 0.034839630126953125, 0.03724098205566406, 0.039642333984375, 0.04204368591308594, 0.044445037841796875, 0.04684638977050781, 0.04924774169921875, 0.05164909362792969, 0.054050445556640625, 0.05645179748535156, 0.0588531494140625, 0.06125450134277344, 0.06365585327148438, 0.06605720520019531, 0.06845855712890625, 0.07085990905761719, 0.07326126098632812, 0.07566261291503906, 0.07806396484375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 11.0, 16.0, 43.0, 88.0, 150.0, 273.0, 208.0, 122.0, 61.0, 22.0, 9.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3032209873199463, -2.202120542526245, -2.101020097732544, -1.9999196529388428, -1.8988192081451416, -1.7977187633514404, -1.6966183185577393, -1.595517873764038, -1.494417428970337, -1.3933169841766357, -1.2922165393829346, -1.1911160945892334, -1.0900156497955322, -0.988915205001831, -0.8878147602081299, -0.7867143154144287, -0.6856138706207275, -0.5845134258270264, -0.4834129810333252, -0.382312536239624, -0.28121209144592285, -0.18011164665222168, -0.07901120185852051, 0.022089242935180664, 0.12318968772888184, 0.224290132522583, 0.3253905773162842, 0.42649102210998535, 0.5275914669036865, 0.6286919116973877, 0.7297923564910889, 0.83089280128479, 0.9319934844970703, 1.0330939292907715, 1.1341943740844727, 1.2352948188781738, 1.336395263671875, 1.4374957084655762, 1.5385961532592773, 1.6396965980529785, 1.7407970428466797, 1.8418974876403809, 1.942997932434082, 2.044098377227783, 2.1451988220214844, 2.2462992668151855, 2.3473997116088867, 2.448500156402588, 2.549600601196289, 2.6507010459899902, 2.7518014907836914, 2.8529019355773926, 2.9540023803710938, 3.055102825164795, 3.156203269958496, 3.2573037147521973, 3.3584041595458984, 3.4595046043395996, 3.560605049133301, 3.661705493927002, 3.762805938720703, 3.8639063835144043, 3.9650068283081055, 4.066107273101807, 4.167207717895508]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 2.0, 12.0, 13.0, 8.0, 16.0, 9.0, 20.0, 29.0, 22.0, 39.0, 34.0, 42.0, 39.0, 50.0, 57.0, 54.0, 58.0, 51.0, 43.0, 50.0, 51.0, 36.0, 44.0, 42.0, 27.0, 23.0, 26.0, 22.0, 16.0, 9.0, 16.0, 7.0, 8.0, 10.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8342761993408203, -1.7787529230117798, -1.7232296466827393, -1.6677063703536987, -1.6121830940246582, -1.5566599369049072, -1.5011365413665771, -1.4456133842468262, -1.3900901079177856, -1.3345668315887451, -1.2790435552597046, -1.223520278930664, -1.1679970026016235, -1.112473726272583, -1.056950569152832, -1.0014272928237915, -0.9459039568901062, -0.8903806805610657, -0.8348574042320251, -0.7793341875076294, -0.7238109111785889, -0.6682876348495483, -0.6127643585205078, -0.5572410821914673, -0.5017178058624268, -0.44619452953338623, -0.3906712830066681, -0.33514800667762756, -0.2796247601509094, -0.2241014838218689, -0.16857820749282837, -0.11305496096611023, -0.05753171443939209, -0.002008449286222458, 0.053514815866947174, 0.1090380847454071, 0.16456134617328644, 0.22008460760116577, 0.2756078839302063, 0.33113113045692444, 0.38665440678596497, 0.4421776831150055, 0.49770092964172363, 0.5532242059707642, 0.6087474822998047, 0.6642707586288452, 0.7197940349578857, 0.7753172516822815, 0.830840528011322, 0.8863638043403625, 0.9418870806694031, 0.9974102973937988, 1.0529335737228394, 1.1084568500518799, 1.1639801263809204, 1.219503402709961, 1.2750266790390015, 1.330549955368042, 1.3860732316970825, 1.441596508026123, 1.4971197843551636, 1.552643060684204, 1.608166217803955, 1.6636894941329956, 1.7192127704620361]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 3.0, 7.0, 7.0, 19.0, 17.0, 29.0, 53.0, 117.0, 238.0, 640.0, 4731.0, 4178819.0, 8170.0, 875.0, 254.0, 122.0, 68.0, 44.0, 27.0, 13.0, 6.0, 10.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.240234375, -1.2096710205078125, -1.179107666015625, -1.1485443115234375, -1.11798095703125, -1.0874176025390625, -1.056854248046875, -1.0262908935546875, -0.9957275390625, -0.9651641845703125, -0.934600830078125, -0.9040374755859375, -0.87347412109375, -0.8429107666015625, -0.812347412109375, -0.7817840576171875, -0.751220703125, -0.7206573486328125, -0.690093994140625, -0.6595306396484375, -0.62896728515625, -0.5984039306640625, -0.567840576171875, -0.5372772216796875, -0.5067138671875, -0.4761505126953125, -0.445587158203125, -0.4150238037109375, -0.38446044921875, -0.3538970947265625, -0.323333740234375, -0.2927703857421875, -0.26220703125, -0.2316436767578125, -0.201080322265625, -0.1705169677734375, -0.13995361328125, -0.1093902587890625, -0.078826904296875, -0.0482635498046875, -0.0177001953125, 0.0128631591796875, 0.043426513671875, 0.0739898681640625, 0.10455322265625, 0.1351165771484375, 0.165679931640625, 0.1962432861328125, 0.226806640625, 0.2573699951171875, 0.287933349609375, 0.3184967041015625, 0.34906005859375, 0.3796234130859375, 0.410186767578125, 0.4407501220703125, 0.4713134765625, 0.5018768310546875, 0.532440185546875, 0.5630035400390625, 0.59356689453125, 0.6241302490234375, 0.654693603515625, 0.6852569580078125, 0.7158203125]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 9.0, 5.0, 15.0, 16.0, 10.0, 18.0, 20.0, 15.0, 28.0, 42.0, 29.0, 38.0, 35.0, 53.0, 45.0, 56.0, 52.0, 55.0, 49.0, 56.0, 46.0, 50.0, 48.0, 33.0, 33.0, 19.0, 24.0, 23.0, 16.0, 11.0, 11.0, 17.0, 6.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.088134765625, -0.08537673950195312, -0.08261871337890625, -0.07986068725585938, -0.0771026611328125, -0.07434463500976562, -0.07158660888671875, -0.06882858276367188, -0.066070556640625, -0.06331253051757812, -0.06055450439453125, -0.057796478271484375, -0.0550384521484375, -0.052280426025390625, -0.04952239990234375, -0.046764373779296875, -0.04400634765625, -0.041248321533203125, -0.03849029541015625, -0.035732269287109375, -0.0329742431640625, -0.030216217041015625, -0.02745819091796875, -0.024700164794921875, -0.021942138671875, -0.019184112548828125, -0.01642608642578125, -0.013668060302734375, -0.0109100341796875, -0.008152008056640625, -0.00539398193359375, -0.002635955810546875, 0.0001220703125, 0.002880096435546875, 0.00563812255859375, 0.008396148681640625, 0.0111541748046875, 0.013912200927734375, 0.01667022705078125, 0.019428253173828125, 0.022186279296875, 0.024944305419921875, 0.02770233154296875, 0.030460357666015625, 0.0332183837890625, 0.035976409912109375, 0.03873443603515625, 0.041492462158203125, 0.04425048828125, 0.047008514404296875, 0.04976654052734375, 0.052524566650390625, 0.0552825927734375, 0.058040618896484375, 0.06079864501953125, 0.06355667114257812, 0.066314697265625, 0.06907272338867188, 0.07183074951171875, 0.07458877563476562, 0.0773468017578125, 0.08010482788085938, 0.08286285400390625, 0.08562088012695312, 0.08837890625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 4.0, 10.0, 6.0, 14.0, 21.0, 26.0, 36.0, 32.0, 65.0, 75.0, 93.0, 125.0, 173.0, 239.0, 349.0, 559.0, 1232.0, 3418.0, 28460.0, 4133849.0, 19712.0, 2950.0, 1064.0, 567.0, 321.0, 231.0, 160.0, 125.0, 88.0, 59.0, 59.0, 44.0, 36.0, 21.0, 17.0, 11.0, 12.0, 4.0, 4.0, 2.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42138671875, -0.407073974609375, -0.39276123046875, -0.378448486328125, -0.3641357421875, -0.349822998046875, -0.33551025390625, -0.321197509765625, -0.306884765625, -0.292572021484375, -0.27825927734375, -0.263946533203125, -0.2496337890625, -0.235321044921875, -0.22100830078125, -0.206695556640625, -0.1923828125, -0.178070068359375, -0.16375732421875, -0.149444580078125, -0.1351318359375, -0.120819091796875, -0.10650634765625, -0.092193603515625, -0.077880859375, -0.063568115234375, -0.04925537109375, -0.034942626953125, -0.0206298828125, -0.006317138671875, 0.00799560546875, 0.022308349609375, 0.03662109375, 0.050933837890625, 0.06524658203125, 0.079559326171875, 0.0938720703125, 0.108184814453125, 0.12249755859375, 0.136810302734375, 0.151123046875, 0.165435791015625, 0.17974853515625, 0.194061279296875, 0.2083740234375, 0.222686767578125, 0.23699951171875, 0.251312255859375, 0.265625, 0.279937744140625, 0.29425048828125, 0.308563232421875, 0.3228759765625, 0.337188720703125, 0.35150146484375, 0.365814208984375, 0.380126953125, 0.394439697265625, 0.40875244140625, 0.423065185546875, 0.4373779296875, 0.451690673828125, 0.46600341796875, 0.480316162109375, 0.49462890625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 0.0, 7.0, 7.0, 24.0, 90.0, 3460.0, 398.0, 45.0, 21.0, 14.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09515380859375, -0.09197330474853516, -0.08879280090332031, -0.08561229705810547, -0.08243179321289062, -0.07925128936767578, -0.07607078552246094, -0.0728902816772461, -0.06970977783203125, -0.0665292739868164, -0.06334877014160156, -0.06016826629638672, -0.056987762451171875, -0.05380725860595703, -0.05062675476074219, -0.047446250915527344, -0.0442657470703125, -0.041085243225097656, -0.03790473937988281, -0.03472423553466797, -0.031543731689453125, -0.02836322784423828, -0.025182723999023438, -0.022002220153808594, -0.01882171630859375, -0.015641212463378906, -0.012460708618164062, -0.009280204772949219, -0.006099700927734375, -0.0029191970825195312, 0.0002613067626953125, 0.0034418106079101562, 0.006622314453125, 0.009802818298339844, 0.012983322143554688, 0.01616382598876953, 0.019344329833984375, 0.02252483367919922, 0.025705337524414062, 0.028885841369628906, 0.03206634521484375, 0.035246849060058594, 0.03842735290527344, 0.04160785675048828, 0.044788360595703125, 0.04796886444091797, 0.05114936828613281, 0.054329872131347656, 0.0575103759765625, 0.060690879821777344, 0.06387138366699219, 0.06705188751220703, 0.07023239135742188, 0.07341289520263672, 0.07659339904785156, 0.0797739028930664, 0.08295440673828125, 0.0861349105834961, 0.08931541442871094, 0.09249591827392578, 0.09567642211914062, 0.09885692596435547, 0.10203742980957031, 0.10521793365478516, 0.1083984375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 1.0, 4.0, 10.0, 9.0, 26.0, 59.0, 65.0, 116.0, 137.0, 145.0, 141.0, 114.0, 75.0, 34.0, 32.0, 14.0, 9.0, 5.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19558745622634888, -0.18652373552322388, -0.17746001482009888, -0.16839627921581268, -0.15933255851268768, -0.15026883780956268, -0.1412051022052765, -0.1321413815021515, -0.12307766079902649, -0.11401394009590149, -0.10495021194219589, -0.0958864837884903, -0.0868227630853653, -0.0777590423822403, -0.0686953142285347, -0.0596315860748291, -0.0505678653717041, -0.0415041409432888, -0.032440416514873505, -0.023376692086458206, -0.014312967658042908, -0.005249243229627609, 0.003814481198787689, 0.012878209352493286, 0.021941930055618286, 0.031005654484033585, 0.04006937891244888, 0.04913310334086418, 0.05819682776927948, 0.06726054847240448, 0.07632427662611008, 0.08538800477981567, 0.09445172548294067, 0.10351544618606567, 0.11257917433977127, 0.12164290249347687, 0.13070662319660187, 0.13977034389972687, 0.14883407950401306, 0.15789780020713806, 0.16696152091026306, 0.17602524161338806, 0.18508896231651306, 0.19415269792079926, 0.20321641862392426, 0.21228013932704926, 0.22134387493133545, 0.23040759563446045, 0.23947131633758545, 0.24853503704071045, 0.25759875774383545, 0.26666247844696045, 0.27572619915008545, 0.28478994965553284, 0.29385367035865784, 0.30291739106178284, 0.31198111176490784, 0.32104483246803284, 0.33010855317115784, 0.33917227387428284, 0.3482360243797302, 0.3572997450828552, 0.3663634657859802, 0.3754271864891052, 0.3844909071922302]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 3.0, 4.0, 9.0, 9.0, 9.0, 11.0, 18.0, 17.0, 21.0, 26.0, 33.0, 37.0, 36.0, 43.0, 37.0, 43.0, 38.0, 42.0, 51.0, 42.0, 50.0, 54.0, 32.0, 36.0, 35.0, 33.0, 39.0, 27.0, 23.0, 18.0, 15.0, 21.0, 15.0, 20.0, 15.0, 11.0, 7.0, 8.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.151891827583313, -0.14798298478126526, -0.14407412707805634, -0.1401652693748474, -0.13625642657279968, -0.13234758377075195, -0.12843872606754303, -0.1245298758149147, -0.12062102556228638, -0.11671217530965805, -0.11280332505702972, -0.1088944748044014, -0.10498562455177307, -0.10107677429914474, -0.09716792404651642, -0.09325907379388809, -0.08935022354125977, -0.08544137328863144, -0.08153252303600311, -0.07762367278337479, -0.07371482253074646, -0.06980597227811813, -0.06589712202548981, -0.06198827177286148, -0.058079421520233154, -0.05417057126760483, -0.0502617210149765, -0.046352870762348175, -0.04244402050971985, -0.03853517025709152, -0.034626320004463196, -0.03071746975183487, -0.026808619499206543, -0.022899769246578217, -0.01899091899394989, -0.015082068741321564, -0.011173218488693237, -0.007264368236064911, -0.0033555179834365845, 0.0005533322691917419, 0.004462182521820068, 0.008371032774448395, 0.012279883027076721, 0.016188733279705048, 0.020097583532333374, 0.0240064337849617, 0.027915284037590027, 0.03182413429021835, 0.03573298454284668, 0.039641834795475006, 0.04355068504810333, 0.04745953530073166, 0.051368385553359985, 0.05527723580598831, 0.05918608605861664, 0.06309493631124496, 0.06700378656387329, 0.07091263681650162, 0.07482148706912994, 0.07873033732175827, 0.0826391875743866, 0.08654803782701492, 0.09045688807964325, 0.09436573833227158, 0.0982745885848999]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 6.0, 5.0, 16.0, 5.0, 11.0, 17.0, 23.0, 40.0, 44.0, 90.0, 154.0, 244.0, 428.0, 857.0, 2162.0, 6312.0, 23611.0, 131724.0, 607471.0, 225535.0, 36021.0, 8776.0, 2666.0, 1097.0, 526.0, 251.0, 168.0, 92.0, 58.0, 46.0, 29.0, 23.0, 15.0, 12.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.341552734375, -0.33139801025390625, -0.3212432861328125, -0.31108856201171875, -0.300933837890625, -0.29077911376953125, -0.2806243896484375, -0.27046966552734375, -0.26031494140625, -0.25016021728515625, -0.2400054931640625, -0.22985076904296875, -0.219696044921875, -0.20954132080078125, -0.1993865966796875, -0.18923187255859375, -0.1790771484375, -0.16892242431640625, -0.1587677001953125, -0.14861297607421875, -0.138458251953125, -0.12830352783203125, -0.1181488037109375, -0.10799407958984375, -0.09783935546875, -0.08768463134765625, -0.0775299072265625, -0.06737518310546875, -0.057220458984375, -0.04706573486328125, -0.0369110107421875, -0.02675628662109375, -0.0166015625, -0.00644683837890625, 0.0037078857421875, 0.01386260986328125, 0.024017333984375, 0.03417205810546875, 0.0443267822265625, 0.05448150634765625, 0.06463623046875, 0.07479095458984375, 0.0849456787109375, 0.09510040283203125, 0.105255126953125, 0.11540985107421875, 0.1255645751953125, 0.13571929931640625, 0.1458740234375, 0.15602874755859375, 0.1661834716796875, 0.17633819580078125, 0.186492919921875, 0.19664764404296875, 0.2068023681640625, 0.21695709228515625, 0.22711181640625, 0.23726654052734375, 0.2474212646484375, 0.25757598876953125, 0.267730712890625, 0.27788543701171875, 0.2880401611328125, 0.29819488525390625, 0.308349609375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 4.0, 6.0, 8.0, 9.0, 12.0, 21.0, 20.0, 20.0, 24.0, 28.0, 27.0, 38.0, 39.0, 39.0, 46.0, 39.0, 55.0, 60.0, 57.0, 53.0, 54.0, 42.0, 53.0, 43.0, 35.0, 24.0, 27.0, 17.0, 20.0, 17.0, 14.0, 15.0, 10.0, 5.0, 7.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08941650390625, -0.08659934997558594, -0.08378219604492188, -0.08096504211425781, -0.07814788818359375, -0.07533073425292969, -0.07251358032226562, -0.06969642639160156, -0.0668792724609375, -0.06406211853027344, -0.061244964599609375, -0.05842781066894531, -0.05561065673828125, -0.05279350280761719, -0.049976348876953125, -0.04715919494628906, -0.044342041015625, -0.04152488708496094, -0.038707733154296875, -0.03589057922363281, -0.03307342529296875, -0.030256271362304688, -0.027439117431640625, -0.024621963500976562, -0.0218048095703125, -0.018987655639648438, -0.016170501708984375, -0.013353347778320312, -0.01053619384765625, -0.0077190399169921875, -0.004901885986328125, -0.0020847320556640625, 0.000732421875, 0.0035495758056640625, 0.006366729736328125, 0.009183883666992188, 0.01200103759765625, 0.014818191528320312, 0.017635345458984375, 0.020452499389648438, 0.0232696533203125, 0.026086807250976562, 0.028903961181640625, 0.03172111511230469, 0.03453826904296875, 0.03735542297363281, 0.040172576904296875, 0.04298973083496094, 0.045806884765625, 0.04862403869628906, 0.051441192626953125, 0.05425834655761719, 0.05707550048828125, 0.05989265441894531, 0.06270980834960938, 0.06552696228027344, 0.0683441162109375, 0.07116127014160156, 0.07397842407226562, 0.07679557800292969, 0.07961273193359375, 0.08242988586425781, 0.08524703979492188, 0.08806419372558594, 0.09088134765625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 5.0, 7.0, 10.0, 18.0, 9.0, 12.0, 25.0, 27.0, 39.0, 42.0, 70.0, 111.0, 176.0, 333.0, 718.0, 1748.0, 5685.0, 24260.0, 173398.0, 690063.0, 124829.0, 19384.0, 4729.0, 1479.0, 553.0, 270.0, 153.0, 115.0, 68.0, 45.0, 39.0, 35.0, 14.0, 19.0, 18.0, 13.0, 7.0, 5.0, 8.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.309814453125, -0.3008155822753906, -0.29181671142578125, -0.2828178405761719, -0.2738189697265625, -0.2648200988769531, -0.25582122802734375, -0.24682235717773438, -0.237823486328125, -0.22882461547851562, -0.21982574462890625, -0.21082687377929688, -0.2018280029296875, -0.19282913208007812, -0.18383026123046875, -0.17483139038085938, -0.16583251953125, -0.15683364868164062, -0.14783477783203125, -0.13883590698242188, -0.1298370361328125, -0.12083816528320312, -0.11183929443359375, -0.10284042358398438, -0.093841552734375, -0.08484268188476562, -0.07584381103515625, -0.06684494018554688, -0.0578460693359375, -0.048847198486328125, -0.03984832763671875, -0.030849456787109375, -0.0218505859375, -0.012851715087890625, -0.00385284423828125, 0.005146026611328125, 0.0141448974609375, 0.023143768310546875, 0.03214263916015625, 0.041141510009765625, 0.050140380859375, 0.059139251708984375, 0.06813812255859375, 0.07713699340820312, 0.0861358642578125, 0.09513473510742188, 0.10413360595703125, 0.11313247680664062, 0.12213134765625, 0.13113021850585938, 0.14012908935546875, 0.14912796020507812, 0.1581268310546875, 0.16712570190429688, 0.17612457275390625, 0.18512344360351562, 0.194122314453125, 0.20312118530273438, 0.21212005615234375, 0.22111892700195312, 0.2301177978515625, 0.23911666870117188, 0.24811553955078125, 0.2571144104003906, 0.26611328125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 2.0, 3.0, 7.0, 9.0, 6.0, 13.0, 6.0, 20.0, 22.0, 18.0, 31.0, 29.0, 36.0, 26.0, 41.0, 35.0, 36.0, 32.0, 37.0, 52.0, 40.0, 45.0, 48.0, 43.0, 36.0, 40.0, 29.0, 36.0, 31.0, 26.0, 25.0, 30.0, 18.0, 11.0, 21.0, 17.0, 16.0, 8.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.304931640625, -0.2956428527832031, -0.28635406494140625, -0.2770652770996094, -0.2677764892578125, -0.2584877014160156, -0.24919891357421875, -0.23991012573242188, -0.230621337890625, -0.22133255004882812, -0.21204376220703125, -0.20275497436523438, -0.1934661865234375, -0.18417739868164062, -0.17488861083984375, -0.16559982299804688, -0.15631103515625, -0.14702224731445312, -0.13773345947265625, -0.12844467163085938, -0.1191558837890625, -0.10986709594726562, -0.10057830810546875, -0.09128952026367188, -0.082000732421875, -0.07271194458007812, -0.06342315673828125, -0.054134368896484375, -0.0448455810546875, -0.035556793212890625, -0.02626800537109375, -0.016979217529296875, -0.0076904296875, 0.001598358154296875, 0.01088714599609375, 0.020175933837890625, 0.0294647216796875, 0.038753509521484375, 0.04804229736328125, 0.057331085205078125, 0.066619873046875, 0.07590866088867188, 0.08519744873046875, 0.09448623657226562, 0.1037750244140625, 0.11306381225585938, 0.12235260009765625, 0.13164138793945312, 0.14093017578125, 0.15021896362304688, 0.15950775146484375, 0.16879653930664062, 0.1780853271484375, 0.18737411499023438, 0.19666290283203125, 0.20595169067382812, 0.215240478515625, 0.22452926635742188, 0.23381805419921875, 0.24310684204101562, 0.2523956298828125, 0.2616844177246094, 0.27097320556640625, 0.2802619934082031, 0.28955078125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 2.0, 7.0, 9.0, 10.0, 13.0, 17.0, 20.0, 21.0, 38.0, 59.0, 108.0, 159.0, 304.0, 545.0, 1254.0, 3311.0, 11002.0, 75704.0, 801072.0, 132779.0, 15034.0, 4089.0, 1499.0, 673.0, 322.0, 168.0, 119.0, 76.0, 35.0, 32.0, 16.0, 17.0, 15.0, 10.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11529541015625, -0.11126422882080078, -0.10723304748535156, -0.10320186614990234, -0.09917068481445312, -0.0951395034790039, -0.09110832214355469, -0.08707714080810547, -0.08304595947265625, -0.07901477813720703, -0.07498359680175781, -0.0709524154663086, -0.06692123413085938, -0.06289005279541016, -0.05885887145996094, -0.05482769012451172, -0.0507965087890625, -0.04676532745361328, -0.04273414611816406, -0.038702964782714844, -0.034671783447265625, -0.030640602111816406, -0.026609420776367188, -0.02257823944091797, -0.01854705810546875, -0.014515876770019531, -0.010484695434570312, -0.006453514099121094, -0.002422332763671875, 0.0016088485717773438, 0.0056400299072265625, 0.009671211242675781, 0.013702392578125, 0.01773357391357422, 0.021764755249023438, 0.025795936584472656, 0.029827117919921875, 0.033858299255371094, 0.03788948059082031, 0.04192066192626953, 0.04595184326171875, 0.04998302459716797, 0.05401420593261719, 0.058045387268066406, 0.062076568603515625, 0.06610774993896484, 0.07013893127441406, 0.07417011260986328, 0.0782012939453125, 0.08223247528076172, 0.08626365661621094, 0.09029483795166016, 0.09432601928710938, 0.0983572006225586, 0.10238838195800781, 0.10641956329345703, 0.11045074462890625, 0.11448192596435547, 0.11851310729980469, 0.1225442886352539, 0.12657546997070312, 0.13060665130615234, 0.13463783264160156, 0.13866901397705078, 0.1427001953125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 6.0, 15.0, 23.0, 19.0, 38.0, 84.0, 95.0, 137.0, 154.0, 151.0, 93.0, 71.0, 40.0, 24.0, 12.0, 16.0, 9.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8715858459472656e-05, -1.7807818949222565e-05, -1.6899779438972473e-05, -1.599173992872238e-05, -1.508370041847229e-05, -1.4175660908222198e-05, -1.3267621397972107e-05, -1.2359581887722015e-05, -1.1451542377471924e-05, -1.0543502867221832e-05, -9.63546335697174e-06, -8.72742384672165e-06, -7.819384336471558e-06, -6.911344826221466e-06, -6.0033053159713745e-06, -5.095265805721283e-06, -4.187226295471191e-06, -3.2791867852211e-06, -2.3711472749710083e-06, -1.4631077647209167e-06, -5.550682544708252e-07, 3.5297125577926636e-07, 1.261010766029358e-06, 2.1690502762794495e-06, 3.077089786529541e-06, 3.9851292967796326e-06, 4.893168807029724e-06, 5.801208317279816e-06, 6.709247827529907e-06, 7.617287337779999e-06, 8.52532684803009e-06, 9.433366358280182e-06, 1.0341405868530273e-05, 1.1249445378780365e-05, 1.2157484889030457e-05, 1.3065524399280548e-05, 1.397356390953064e-05, 1.4881603419780731e-05, 1.5789642930030823e-05, 1.6697682440280914e-05, 1.7605721950531006e-05, 1.8513761460781097e-05, 1.942180097103119e-05, 2.032984048128128e-05, 2.1237879991531372e-05, 2.2145919501781464e-05, 2.3053959012031555e-05, 2.3961998522281647e-05, 2.4870038032531738e-05, 2.577807754278183e-05, 2.668611705303192e-05, 2.7594156563282013e-05, 2.8502196073532104e-05, 2.9410235583782196e-05, 3.0318275094032288e-05, 3.122631460428238e-05, 3.213435411453247e-05, 3.304239362478256e-05, 3.3950433135032654e-05, 3.4858472645282745e-05, 3.576651215553284e-05, 3.667455166578293e-05, 3.758259117603302e-05, 3.849063068628311e-05, 3.93986701965332e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 10.0, 13.0, 22.0, 21.0, 35.0, 49.0, 78.0, 160.0, 295.0, 833.0, 2964.0, 15651.0, 377604.0, 624325.0, 21210.0, 3504.0, 962.0, 375.0, 154.0, 87.0, 66.0, 43.0, 21.0, 19.0, 20.0, 6.0, 5.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.2354736328125, -0.2295970916748047, -0.22372055053710938, -0.21784400939941406, -0.21196746826171875, -0.20609092712402344, -0.20021438598632812, -0.1943378448486328, -0.1884613037109375, -0.1825847625732422, -0.17670822143554688, -0.17083168029785156, -0.16495513916015625, -0.15907859802246094, -0.15320205688476562, -0.1473255157470703, -0.141448974609375, -0.1355724334716797, -0.12969589233398438, -0.12381935119628906, -0.11794281005859375, -0.11206626892089844, -0.10618972778320312, -0.10031318664550781, -0.0944366455078125, -0.08856010437011719, -0.08268356323242188, -0.07680702209472656, -0.07093048095703125, -0.06505393981933594, -0.059177398681640625, -0.05330085754394531, -0.04742431640625, -0.04154777526855469, -0.035671234130859375, -0.029794692993164062, -0.02391815185546875, -0.018041610717773438, -0.012165069580078125, -0.0062885284423828125, -0.0004119873046875, 0.0054645538330078125, 0.011341094970703125, 0.017217636108398438, 0.02309417724609375, 0.028970718383789062, 0.034847259521484375, 0.04072380065917969, 0.046600341796875, 0.05247688293457031, 0.058353424072265625, 0.06422996520996094, 0.07010650634765625, 0.07598304748535156, 0.08185958862304688, 0.08773612976074219, 0.0936126708984375, 0.09948921203613281, 0.10536575317382812, 0.11124229431152344, 0.11711883544921875, 0.12299537658691406, 0.12887191772460938, 0.1347484588623047, 0.140625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 9.0, 6.0, 26.0, 35.0, 64.0, 97.0, 150.0, 151.0, 158.0, 105.0, 77.0, 38.0, 24.0, 18.0, 4.0, 8.0, 4.0, 5.0, 2.0, 1.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1787109375, -0.17395973205566406, -0.16920852661132812, -0.1644573211669922, -0.15970611572265625, -0.1549549102783203, -0.15020370483398438, -0.14545249938964844, -0.1407012939453125, -0.13595008850097656, -0.13119888305664062, -0.1264476776123047, -0.12169647216796875, -0.11694526672363281, -0.11219406127929688, -0.10744285583496094, -0.102691650390625, -0.09794044494628906, -0.09318923950195312, -0.08843803405761719, -0.08368682861328125, -0.07893562316894531, -0.07418441772460938, -0.06943321228027344, -0.0646820068359375, -0.05993080139160156, -0.055179595947265625, -0.05042839050292969, -0.04567718505859375, -0.04092597961425781, -0.036174774169921875, -0.03142356872558594, -0.02667236328125, -0.021921157836914062, -0.017169952392578125, -0.012418746948242188, -0.00766754150390625, -0.0029163360595703125, 0.001834869384765625, 0.0065860748291015625, 0.0113372802734375, 0.016088485717773438, 0.020839691162109375, 0.025590896606445312, 0.03034210205078125, 0.03509330749511719, 0.039844512939453125, 0.04459571838378906, 0.049346923828125, 0.05409812927246094, 0.058849334716796875, 0.06360054016113281, 0.06835174560546875, 0.07310295104980469, 0.07785415649414062, 0.08260536193847656, 0.0873565673828125, 0.09210777282714844, 0.09685897827148438, 0.10161018371582031, 0.10636138916015625, 0.11111259460449219, 0.11586380004882812, 0.12061500549316406, 0.1253662109375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 19.0, 41.0, 134.0, 232.0, 279.0, 174.0, 76.0, 24.0, 11.0, 8.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7699514627456665, -1.6348768472671509, -1.4998022317886353, -1.3647276163101196, -1.229653000831604, -1.0945783853530884, -0.9595037698745728, -0.8244291543960571, -0.6893545389175415, -0.5542799234390259, -0.41920530796051025, -0.28413069248199463, -0.149056077003479, -0.013981461524963379, 0.12109315395355225, 0.25616776943206787, 0.3912423849105835, 0.5263170003890991, 0.6613916158676147, 0.7964662313461304, 0.931540846824646, 1.0666154623031616, 1.2016900777816772, 1.3367646932601929, 1.4718393087387085, 1.6069139242172241, 1.7419885396957397, 1.8770631551742554, 2.0121378898620605, 2.147212505340576, 2.282287120819092, 2.4173617362976074, 2.552436351776123, 2.6875109672546387, 2.8225855827331543, 2.95766019821167, 3.0927348136901855, 3.227809429168701, 3.362884044647217, 3.4979586601257324, 3.633033275604248, 3.7681078910827637, 3.9031825065612793, 4.038257122039795, 4.1733317375183105, 4.308406352996826, 4.443480968475342, 4.578555583953857, 4.713630199432373, 4.848704814910889, 4.983779430389404, 5.11885404586792, 5.2539286613464355, 5.389003276824951, 5.524077892303467, 5.659152507781982, 5.794227123260498, 5.929301738739014, 6.064376354217529, 6.199450969696045, 6.3345255851745605, 6.469600200653076, 6.604674816131592, 6.739749431610107, 6.874824047088623]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 4.0, 5.0, 4.0, 10.0, 8.0, 9.0, 16.0, 19.0, 24.0, 23.0, 33.0, 36.0, 35.0, 33.0, 42.0, 44.0, 52.0, 56.0, 83.0, 39.0, 62.0, 54.0, 40.0, 49.0, 39.0, 43.0, 24.0, 23.0, 19.0, 20.0, 8.0, 13.0, 8.0, 3.0, 7.0, 7.0, 3.0, 3.0, 4.0, 1.0, 6.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.0907747745513916, -2.0352001190185547, -1.9796255826950073, -1.92405104637146, -1.8684765100479126, -1.8129018545150757, -1.7573273181915283, -1.7017526626586914, -1.646178126335144, -1.5906035900115967, -1.5350289344787598, -1.4794543981552124, -1.423879861831665, -1.3683052062988281, -1.3127306699752808, -1.2571561336517334, -1.2015814781188965, -1.1460069417953491, -1.0904322862625122, -1.0348577499389648, -0.9792831540107727, -0.9237085580825806, -0.8681340217590332, -0.8125594258308411, -0.7569849491119385, -0.7014103531837463, -0.645835816860199, -0.5902612209320068, -0.5346866250038147, -0.47911205887794495, -0.4235374927520752, -0.36796289682388306, -0.3123883008956909, -0.25681373476982117, -0.20123913884162903, -0.14566457271575928, -0.09008999168872833, -0.03451541066169739, 0.021059155464172363, 0.0766337513923645, 0.13220831751823425, 0.1877828985452652, 0.24335747957229614, 0.2989320456981659, 0.35450661182403564, 0.4100812077522278, 0.46565577387809753, 0.5212303400039673, 0.5768049359321594, 0.6323795318603516, 0.6879540681838989, 0.7435286641120911, 0.7991032600402832, 0.8546777963638306, 0.9102523922920227, 0.9658269882202148, 1.0214015245437622, 1.0769760608673096, 1.1325507164001465, 1.1881252527236938, 1.2436997890472412, 1.2992744445800781, 1.3548489809036255, 1.4104235172271729, 1.4659981727600098]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 10.0, 13.0, 15.0, 22.0, 49.0, 70.0, 132.0, 303.0, 1096.0, 4188520.0, 3218.0, 428.0, 165.0, 103.0, 50.0, 30.0, 19.0, 14.0, 9.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.93359375, -3.8369140625, -3.740234375, -3.6435546875, -3.546875, -3.4501953125, -3.353515625, -3.2568359375, -3.16015625, -3.0634765625, -2.966796875, -2.8701171875, -2.7734375, -2.6767578125, -2.580078125, -2.4833984375, -2.38671875, -2.2900390625, -2.193359375, -2.0966796875, -2.0, -1.9033203125, -1.806640625, -1.7099609375, -1.61328125, -1.5166015625, -1.419921875, -1.3232421875, -1.2265625, -1.1298828125, -1.033203125, -0.9365234375, -0.83984375, -0.7431640625, -0.646484375, -0.5498046875, -0.453125, -0.3564453125, -0.259765625, -0.1630859375, -0.06640625, 0.0302734375, 0.126953125, 0.2236328125, 0.3203125, 0.4169921875, 0.513671875, 0.6103515625, 0.70703125, 0.8037109375, 0.900390625, 0.9970703125, 1.09375, 1.1904296875, 1.287109375, 1.3837890625, 1.48046875, 1.5771484375, 1.673828125, 1.7705078125, 1.8671875, 1.9638671875, 2.060546875, 2.1572265625, 2.25390625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 3.0, 5.0, 11.0, 8.0, 11.0, 16.0, 22.0, 26.0, 18.0, 28.0, 34.0, 33.0, 43.0, 64.0, 66.0, 62.0, 67.0, 52.0, 64.0, 63.0, 46.0, 39.0, 46.0, 32.0, 18.0, 22.0, 23.0, 29.0, 10.0, 12.0, 6.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.103271484375, -0.10019683837890625, -0.0971221923828125, -0.09404754638671875, -0.090972900390625, -0.08789825439453125, -0.0848236083984375, -0.08174896240234375, -0.07867431640625, -0.07559967041015625, -0.0725250244140625, -0.06945037841796875, -0.066375732421875, -0.06330108642578125, -0.0602264404296875, -0.05715179443359375, -0.0540771484375, -0.05100250244140625, -0.0479278564453125, -0.04485321044921875, -0.041778564453125, -0.03870391845703125, -0.0356292724609375, -0.03255462646484375, -0.02947998046875, -0.02640533447265625, -0.0233306884765625, -0.02025604248046875, -0.017181396484375, -0.01410675048828125, -0.0110321044921875, -0.00795745849609375, -0.0048828125, -0.00180816650390625, 0.0012664794921875, 0.00434112548828125, 0.007415771484375, 0.01049041748046875, 0.0135650634765625, 0.01663970947265625, 0.01971435546875, 0.02278900146484375, 0.0258636474609375, 0.02893829345703125, 0.032012939453125, 0.03508758544921875, 0.0381622314453125, 0.04123687744140625, 0.0443115234375, 0.04738616943359375, 0.0504608154296875, 0.05353546142578125, 0.056610107421875, 0.05968475341796875, 0.0627593994140625, 0.06583404541015625, 0.06890869140625, 0.07198333740234375, 0.0750579833984375, 0.07813262939453125, 0.081207275390625, 0.08428192138671875, 0.0873565673828125, 0.09043121337890625, 0.093505859375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 4.0, 0.0, 6.0, 4.0, 5.0, 7.0, 11.0, 8.0, 20.0, 22.0, 33.0, 34.0, 46.0, 58.0, 76.0, 89.0, 140.0, 191.0, 281.0, 349.0, 521.0, 1081.0, 3592.0, 4043329.0, 138512.0, 3035.0, 993.0, 526.0, 361.0, 235.0, 161.0, 140.0, 101.0, 74.0, 72.0, 42.0, 30.0, 30.0, 27.0, 18.0, 8.0, 5.0, 4.0, 7.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62841796875, -0.6059341430664062, -0.5834503173828125, -0.5609664916992188, -0.538482666015625, -0.5159988403320312, -0.4935150146484375, -0.47103118896484375, -0.44854736328125, -0.42606353759765625, -0.4035797119140625, -0.38109588623046875, -0.358612060546875, -0.33612823486328125, -0.3136444091796875, -0.29116058349609375, -0.2686767578125, -0.24619293212890625, -0.2237091064453125, -0.20122528076171875, -0.178741455078125, -0.15625762939453125, -0.1337738037109375, -0.11128997802734375, -0.08880615234375, -0.06632232666015625, -0.0438385009765625, -0.02135467529296875, 0.001129150390625, 0.02361297607421875, 0.0460968017578125, 0.06858062744140625, 0.091064453125, 0.11354827880859375, 0.1360321044921875, 0.15851593017578125, 0.180999755859375, 0.20348358154296875, 0.2259674072265625, 0.24845123291015625, 0.27093505859375, 0.29341888427734375, 0.3159027099609375, 0.33838653564453125, 0.360870361328125, 0.38335418701171875, 0.4058380126953125, 0.42832183837890625, 0.4508056640625, 0.47328948974609375, 0.4957733154296875, 0.5182571411132812, 0.540740966796875, 0.5632247924804688, 0.5857086181640625, 0.6081924438476562, 0.63067626953125, 0.6531600952148438, 0.6756439208984375, 0.6981277465820312, 0.720611572265625, 0.7430953979492188, 0.7655792236328125, 0.7880630493164062, 0.810546875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 9.0, 22.0, 166.0, 3822.0, 35.0, 17.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1837158203125, -0.1786365509033203, -0.17355728149414062, -0.16847801208496094, -0.16339874267578125, -0.15831947326660156, -0.15324020385742188, -0.1481609344482422, -0.1430816650390625, -0.1380023956298828, -0.13292312622070312, -0.12784385681152344, -0.12276458740234375, -0.11768531799316406, -0.11260604858398438, -0.10752677917480469, -0.102447509765625, -0.09736824035644531, -0.09228897094726562, -0.08720970153808594, -0.08213043212890625, -0.07705116271972656, -0.07197189331054688, -0.06689262390136719, -0.0618133544921875, -0.05673408508300781, -0.051654815673828125, -0.04657554626464844, -0.04149627685546875, -0.03641700744628906, -0.031337738037109375, -0.026258468627929688, -0.02117919921875, -0.016099929809570312, -0.011020660400390625, -0.0059413909912109375, -0.00086212158203125, 0.0042171478271484375, 0.009296417236328125, 0.014375686645507812, 0.0194549560546875, 0.024534225463867188, 0.029613494873046875, 0.03469276428222656, 0.03977203369140625, 0.04485130310058594, 0.049930572509765625, 0.05500984191894531, 0.060089111328125, 0.06516838073730469, 0.07024765014648438, 0.07532691955566406, 0.08040618896484375, 0.08548545837402344, 0.09056472778320312, 0.09564399719238281, 0.1007232666015625, 0.10580253601074219, 0.11088180541992188, 0.11596107482910156, 0.12104034423828125, 0.12611961364746094, 0.13119888305664062, 0.1362781524658203, 0.141357421875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 7.0, 9.0, 32.0, 47.0, 83.0, 174.0, 252.0, 190.0, 94.0, 60.0, 28.0, 18.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3869783878326416, -0.3697558343410492, -0.3525332808494568, -0.335310697555542, -0.3180881440639496, -0.3008655905723572, -0.28364303708076477, -0.26642048358917236, -0.24919791519641876, -0.23197536170482635, -0.21475279331207275, -0.19753023982048035, -0.18030768632888794, -0.16308511793613434, -0.14586256444454193, -0.12863999605178833, -0.11141744256019592, -0.09419488161802292, -0.07697232067584991, -0.05974976718425751, -0.0425272062420845, -0.0253046452999115, -0.008082091808319092, 0.009140469133853912, 0.026363030076026917, 0.04358559101819992, 0.060808148235082626, 0.07803070545196533, 0.09525326639413834, 0.11247582733631134, 0.12969838082790375, 0.14692094922065735, 0.16414350271224976, 0.18136605620384216, 0.19858862459659576, 0.21581117808818817, 0.23303374648094177, 0.2502562999725342, 0.2674788534641266, 0.284701406955719, 0.3019239902496338, 0.3191465437412262, 0.3363690972328186, 0.3535916805267334, 0.3708142340183258, 0.3880367875099182, 0.4052593410015106, 0.422481894493103, 0.43970444798469543, 0.45692700147628784, 0.47414955496788025, 0.49137210845947266, 0.5085946917533875, 0.5258172750473022, 0.5430397987365723, 0.5602623820304871, 0.5774849057197571, 0.5947074890136719, 0.6119300127029419, 0.6291525959968567, 0.6463751196861267, 0.6635977029800415, 0.6808202266693115, 0.6980428099632263, 0.7152653932571411]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 6.0, 5.0, 5.0, 11.0, 8.0, 6.0, 15.0, 18.0, 9.0, 17.0, 24.0, 28.0, 36.0, 28.0, 33.0, 33.0, 42.0, 40.0, 45.0, 44.0, 38.0, 31.0, 42.0, 41.0, 44.0, 42.0, 48.0, 37.0, 35.0, 29.0, 25.0, 16.0, 26.0, 20.0, 15.0, 15.0, 16.0, 5.0, 3.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.16603094339370728, -0.16097138822078705, -0.15591183304786682, -0.1508522927761078, -0.14579273760318756, -0.14073318243026733, -0.1356736272573471, -0.13061407208442688, -0.12555453181266785, -0.12049497663974762, -0.11543542891740799, -0.11037587374448776, -0.10531632602214813, -0.1002567708492279, -0.09519721567630768, -0.09013766050338745, -0.08507810533046722, -0.080018550157547, -0.07495900243520737, -0.06989944726228714, -0.06483989953994751, -0.05978034436702728, -0.054720789194107056, -0.04966123774647713, -0.0446016862988472, -0.03954213485121727, -0.03448258340358734, -0.029423028230667114, -0.024363476783037186, -0.019303925335407257, -0.01424437202513218, -0.009184818714857101, -0.004125267267227173, 0.0009342851117253304, 0.0059938374906778336, 0.011053389869630337, 0.01611294224858284, 0.02117249369621277, 0.026232047006487846, 0.031291600316762924, 0.03635115176439285, 0.04141070321202278, 0.04647025465965271, 0.05152980983257294, 0.056589361280202866, 0.061648912727832794, 0.06670846790075302, 0.07176801562309265, 0.07682757079601288, 0.0818871259689331, 0.08694667369127274, 0.09200622886419296, 0.09706577658653259, 0.10212533175945282, 0.10718488693237305, 0.11224444210529327, 0.1173039898276329, 0.12236354500055313, 0.12742309272289276, 0.132482647895813, 0.13754220306873322, 0.14260175824165344, 0.14766129851341248, 0.1527208536863327, 0.15778040885925293]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 6.0, 6.0, 16.0, 21.0, 24.0, 48.0, 78.0, 124.0, 227.0, 336.0, 595.0, 1262.0, 2556.0, 7397.0, 41443.0, 466448.0, 472909.0, 42384.0, 7456.0, 2514.0, 1182.0, 634.0, 347.0, 194.0, 122.0, 75.0, 52.0, 32.0, 19.0, 16.0, 15.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3232421875, -0.31127166748046875, -0.2993011474609375, -0.28733062744140625, -0.275360107421875, -0.26338958740234375, -0.2514190673828125, -0.23944854736328125, -0.22747802734375, -0.21550750732421875, -0.2035369873046875, -0.19156646728515625, -0.179595947265625, -0.16762542724609375, -0.1556549072265625, -0.14368438720703125, -0.1317138671875, -0.11974334716796875, -0.1077728271484375, -0.09580230712890625, -0.083831787109375, -0.07186126708984375, -0.0598907470703125, -0.04792022705078125, -0.03594970703125, -0.02397918701171875, -0.0120086669921875, -3.814697265625e-05, 0.011932373046875, 0.02390289306640625, 0.0358734130859375, 0.04784393310546875, 0.059814453125, 0.07178497314453125, 0.0837554931640625, 0.09572601318359375, 0.107696533203125, 0.11966705322265625, 0.1316375732421875, 0.14360809326171875, 0.15557861328125, 0.16754913330078125, 0.1795196533203125, 0.19149017333984375, 0.203460693359375, 0.21543121337890625, 0.2274017333984375, 0.23937225341796875, 0.2513427734375, 0.26331329345703125, 0.2752838134765625, 0.28725433349609375, 0.299224853515625, 0.31119537353515625, 0.3231658935546875, 0.33513641357421875, 0.34710693359375, 0.35907745361328125, 0.3710479736328125, 0.38301849365234375, 0.394989013671875, 0.40695953369140625, 0.4189300537109375, 0.43090057373046875, 0.44287109375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 4.0, 7.0, 9.0, 16.0, 14.0, 7.0, 25.0, 23.0, 39.0, 24.0, 29.0, 38.0, 39.0, 65.0, 66.0, 57.0, 74.0, 53.0, 42.0, 53.0, 39.0, 50.0, 49.0, 38.0, 27.0, 20.0, 14.0, 14.0, 16.0, 11.0, 12.0, 9.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10833740234375, -0.10518360137939453, -0.10202980041503906, -0.0988759994506836, -0.09572219848632812, -0.09256839752197266, -0.08941459655761719, -0.08626079559326172, -0.08310699462890625, -0.07995319366455078, -0.07679939270019531, -0.07364559173583984, -0.07049179077148438, -0.0673379898071289, -0.06418418884277344, -0.06103038787841797, -0.0578765869140625, -0.05472278594970703, -0.05156898498535156, -0.048415184020996094, -0.045261383056640625, -0.042107582092285156, -0.03895378112792969, -0.03579998016357422, -0.03264617919921875, -0.02949237823486328, -0.026338577270507812, -0.023184776306152344, -0.020030975341796875, -0.016877174377441406, -0.013723373413085938, -0.010569572448730469, -0.007415771484375, -0.004261970520019531, -0.0011081695556640625, 0.0020456314086914062, 0.005199432373046875, 0.008353233337402344, 0.011507034301757812, 0.014660835266113281, 0.01781463623046875, 0.02096843719482422, 0.024122238159179688, 0.027276039123535156, 0.030429840087890625, 0.033583641052246094, 0.03673744201660156, 0.03989124298095703, 0.0430450439453125, 0.04619884490966797, 0.04935264587402344, 0.052506446838378906, 0.055660247802734375, 0.058814048767089844, 0.06196784973144531, 0.06512165069580078, 0.06827545166015625, 0.07142925262451172, 0.07458305358886719, 0.07773685455322266, 0.08089065551757812, 0.0840444564819336, 0.08719825744628906, 0.09035205841064453, 0.093505859375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 4.0, 12.0, 6.0, 16.0, 18.0, 27.0, 43.0, 48.0, 86.0, 139.0, 210.0, 322.0, 599.0, 1148.0, 2610.0, 8375.0, 46839.0, 589491.0, 357225.0, 30393.0, 6391.0, 2170.0, 984.0, 533.0, 300.0, 196.0, 125.0, 82.0, 45.0, 34.0, 24.0, 12.0, 7.0, 6.0, 10.0, 10.0, 8.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.300048828125, -0.29033660888671875, -0.2806243896484375, -0.27091217041015625, -0.261199951171875, -0.25148773193359375, -0.2417755126953125, -0.23206329345703125, -0.22235107421875, -0.21263885498046875, -0.2029266357421875, -0.19321441650390625, -0.183502197265625, -0.17378997802734375, -0.1640777587890625, -0.15436553955078125, -0.1446533203125, -0.13494110107421875, -0.1252288818359375, -0.11551666259765625, -0.105804443359375, -0.09609222412109375, -0.0863800048828125, -0.07666778564453125, -0.06695556640625, -0.05724334716796875, -0.0475311279296875, -0.03781890869140625, -0.028106689453125, -0.01839447021484375, -0.0086822509765625, 0.00102996826171875, 0.0107421875, 0.02045440673828125, 0.0301666259765625, 0.03987884521484375, 0.049591064453125, 0.05930328369140625, 0.0690155029296875, 0.07872772216796875, 0.08843994140625, 0.09815216064453125, 0.1078643798828125, 0.11757659912109375, 0.127288818359375, 0.13700103759765625, 0.1467132568359375, 0.15642547607421875, 0.1661376953125, 0.17584991455078125, 0.1855621337890625, 0.19527435302734375, 0.204986572265625, 0.21469879150390625, 0.2244110107421875, 0.23412322998046875, 0.24383544921875, 0.25354766845703125, 0.2632598876953125, 0.27297210693359375, 0.282684326171875, 0.29239654541015625, 0.3021087646484375, 0.31182098388671875, 0.321533203125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 9.0, 4.0, 6.0, 8.0, 10.0, 17.0, 16.0, 17.0, 14.0, 22.0, 25.0, 29.0, 30.0, 24.0, 38.0, 31.0, 35.0, 47.0, 37.0, 48.0, 40.0, 42.0, 47.0, 31.0, 37.0, 34.0, 37.0, 33.0, 28.0, 38.0, 23.0, 22.0, 18.0, 22.0, 15.0, 18.0, 6.0, 12.0, 10.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.305419921875, -0.29595947265625, -0.2864990234375, -0.27703857421875, -0.267578125, -0.25811767578125, -0.2486572265625, -0.23919677734375, -0.229736328125, -0.22027587890625, -0.2108154296875, -0.20135498046875, -0.19189453125, -0.18243408203125, -0.1729736328125, -0.16351318359375, -0.154052734375, -0.14459228515625, -0.1351318359375, -0.12567138671875, -0.1162109375, -0.10675048828125, -0.0972900390625, -0.08782958984375, -0.078369140625, -0.06890869140625, -0.0594482421875, -0.04998779296875, -0.04052734375, -0.03106689453125, -0.0216064453125, -0.01214599609375, -0.002685546875, 0.00677490234375, 0.0162353515625, 0.02569580078125, 0.03515625, 0.04461669921875, 0.0540771484375, 0.06353759765625, 0.072998046875, 0.08245849609375, 0.0919189453125, 0.10137939453125, 0.11083984375, 0.12030029296875, 0.1297607421875, 0.13922119140625, 0.148681640625, 0.15814208984375, 0.1676025390625, 0.17706298828125, 0.1865234375, 0.19598388671875, 0.2054443359375, 0.21490478515625, 0.224365234375, 0.23382568359375, 0.2432861328125, 0.25274658203125, 0.26220703125, 0.27166748046875, 0.2811279296875, 0.29058837890625, 0.300048828125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 9.0, 13.0, 25.0, 27.0, 46.0, 65.0, 150.0, 345.0, 863.0, 2549.0, 10837.0, 104888.0, 860477.0, 57271.0, 7702.0, 2033.0, 664.0, 300.0, 118.0, 55.0, 44.0, 23.0, 13.0, 15.0, 6.0, 1.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.139892578125, -0.13478660583496094, -0.12968063354492188, -0.12457466125488281, -0.11946868896484375, -0.11436271667480469, -0.10925674438476562, -0.10415077209472656, -0.0990447998046875, -0.09393882751464844, -0.08883285522460938, -0.08372688293457031, -0.07862091064453125, -0.07351493835449219, -0.06840896606445312, -0.06330299377441406, -0.058197021484375, -0.05309104919433594, -0.047985076904296875, -0.04287910461425781, -0.03777313232421875, -0.03266716003417969, -0.027561187744140625, -0.022455215454101562, -0.0173492431640625, -0.012243270874023438, -0.007137298583984375, -0.0020313262939453125, 0.00307464599609375, 0.008180618286132812, 0.013286590576171875, 0.018392562866210938, 0.02349853515625, 0.028604507446289062, 0.033710479736328125, 0.03881645202636719, 0.04392242431640625, 0.04902839660644531, 0.054134368896484375, 0.05924034118652344, 0.0643463134765625, 0.06945228576660156, 0.07455825805664062, 0.07966423034667969, 0.08477020263671875, 0.08987617492675781, 0.09498214721679688, 0.10008811950683594, 0.105194091796875, 0.11030006408691406, 0.11540603637695312, 0.12051200866699219, 0.12561798095703125, 0.1307239532470703, 0.13582992553710938, 0.14093589782714844, 0.1460418701171875, 0.15114784240722656, 0.15625381469726562, 0.1613597869873047, 0.16646575927734375, 0.1715717315673828, 0.17667770385742188, 0.18178367614746094, 0.1868896484375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 11.0, 6.0, 14.0, 23.0, 49.0, 60.0, 113.0, 168.0, 185.0, 146.0, 97.0, 51.0, 28.0, 17.0, 12.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.6193599700927734e-05, -4.5124441385269165e-05, -4.4055283069610596e-05, -4.2986124753952026e-05, -4.191696643829346e-05, -4.084780812263489e-05, -3.977864980697632e-05, -3.870949149131775e-05, -3.764033317565918e-05, -3.657117486000061e-05, -3.550201654434204e-05, -3.443285822868347e-05, -3.33636999130249e-05, -3.229454159736633e-05, -3.1225383281707764e-05, -3.0156224966049194e-05, -2.9087066650390625e-05, -2.8017908334732056e-05, -2.6948750019073486e-05, -2.5879591703414917e-05, -2.4810433387756348e-05, -2.374127507209778e-05, -2.267211675643921e-05, -2.160295844078064e-05, -2.053380012512207e-05, -1.94646418094635e-05, -1.839548349380493e-05, -1.7326325178146362e-05, -1.6257166862487793e-05, -1.5188008546829224e-05, -1.4118850231170654e-05, -1.3049691915512085e-05, -1.1980533599853516e-05, -1.0911375284194946e-05, -9.842216968536377e-06, -8.773058652877808e-06, -7.703900337219238e-06, -6.634742021560669e-06, -5.5655837059021e-06, -4.49642539024353e-06, -3.427267074584961e-06, -2.3581087589263916e-06, -1.2889504432678223e-06, -2.1979212760925293e-07, 8.493661880493164e-07, 1.9185245037078857e-06, 2.987682819366455e-06, 4.056841135025024e-06, 5.125999450683594e-06, 6.195157766342163e-06, 7.264316082000732e-06, 8.333474397659302e-06, 9.402632713317871e-06, 1.047179102897644e-05, 1.154094934463501e-05, 1.2610107660293579e-05, 1.3679265975952148e-05, 1.4748424291610718e-05, 1.5817582607269287e-05, 1.6886740922927856e-05, 1.7955899238586426e-05, 1.9025057554244995e-05, 2.0094215869903564e-05, 2.1163374185562134e-05, 2.2232532501220703e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 4.0, 8.0, 17.0, 15.0, 27.0, 25.0, 64.0, 65.0, 126.0, 201.0, 367.0, 731.0, 1382.0, 2978.0, 7961.0, 28409.0, 236301.0, 684549.0, 62797.0, 13615.0, 4821.0, 1999.0, 934.0, 471.0, 251.0, 168.0, 91.0, 56.0, 40.0, 23.0, 16.0, 9.0, 9.0, 9.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1346435546875, -0.13070964813232422, -0.12677574157714844, -0.12284183502197266, -0.11890792846679688, -0.1149740219116211, -0.11104011535644531, -0.10710620880126953, -0.10317230224609375, -0.09923839569091797, -0.09530448913574219, -0.0913705825805664, -0.08743667602539062, -0.08350276947021484, -0.07956886291503906, -0.07563495635986328, -0.0717010498046875, -0.06776714324951172, -0.06383323669433594, -0.059899330139160156, -0.055965423583984375, -0.052031517028808594, -0.04809761047363281, -0.04416370391845703, -0.04022979736328125, -0.03629589080810547, -0.03236198425292969, -0.028428077697753906, -0.024494171142578125, -0.020560264587402344, -0.016626358032226562, -0.012692451477050781, -0.008758544921875, -0.004824638366699219, -0.0008907318115234375, 0.0030431747436523438, 0.006977081298828125, 0.010910987854003906, 0.014844894409179688, 0.01877880096435547, 0.02271270751953125, 0.02664661407470703, 0.030580520629882812, 0.034514427185058594, 0.038448333740234375, 0.042382240295410156, 0.04631614685058594, 0.05025005340576172, 0.0541839599609375, 0.05811786651611328, 0.06205177307128906, 0.06598567962646484, 0.06991958618164062, 0.0738534927368164, 0.07778739929199219, 0.08172130584716797, 0.08565521240234375, 0.08958911895751953, 0.09352302551269531, 0.0974569320678711, 0.10139083862304688, 0.10532474517822266, 0.10925865173339844, 0.11319255828857422, 0.11712646484375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 4.0, 4.0, 3.0, 9.0, 12.0, 15.0, 35.0, 82.0, 193.0, 235.0, 191.0, 96.0, 47.0, 21.0, 11.0, 8.0, 6.0, 6.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2548828125, -0.24652862548828125, -0.2381744384765625, -0.22982025146484375, -0.221466064453125, -0.21311187744140625, -0.2047576904296875, -0.19640350341796875, -0.18804931640625, -0.17969512939453125, -0.1713409423828125, -0.16298675537109375, -0.154632568359375, -0.14627838134765625, -0.1379241943359375, -0.12957000732421875, -0.1212158203125, -0.11286163330078125, -0.1045074462890625, -0.09615325927734375, -0.087799072265625, -0.07944488525390625, -0.0710906982421875, -0.06273651123046875, -0.05438232421875, -0.04602813720703125, -0.0376739501953125, -0.02931976318359375, -0.020965576171875, -0.01261138916015625, -0.0042572021484375, 0.00409698486328125, 0.012451171875, 0.02080535888671875, 0.0291595458984375, 0.03751373291015625, 0.045867919921875, 0.05422210693359375, 0.0625762939453125, 0.07093048095703125, 0.07928466796875, 0.08763885498046875, 0.0959930419921875, 0.10434722900390625, 0.112701416015625, 0.12105560302734375, 0.1294097900390625, 0.13776397705078125, 0.1461181640625, 0.15447235107421875, 0.1628265380859375, 0.17118072509765625, 0.179534912109375, 0.18788909912109375, 0.1962432861328125, 0.20459747314453125, 0.21295166015625, 0.22130584716796875, 0.2296600341796875, 0.23801422119140625, 0.246368408203125, 0.25472259521484375, 0.2630767822265625, 0.27143096923828125, 0.27978515625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 13.0, 20.0, 36.0, 60.0, 85.0, 135.0, 146.0, 167.0, 140.0, 73.0, 54.0, 28.0, 15.0, 14.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9301108121871948, -1.863906979560852, -1.7977031469345093, -1.731499195098877, -1.6652953624725342, -1.5990915298461914, -1.5328876972198486, -1.4666838645935059, -1.400480031967163, -1.3342761993408203, -1.2680723667144775, -1.2018685340881348, -1.1356645822525024, -1.0694607496261597, -1.003256916999817, -0.9370530843734741, -0.8708491325378418, -0.804645299911499, -0.7384414076805115, -0.6722375750541687, -0.6060336828231812, -0.5398298501968384, -0.4736260175704956, -0.40742215514183044, -0.3412182927131653, -0.2750144302845001, -0.20881058275699615, -0.1426067352294922, -0.07640287280082703, -0.010199010372161865, 0.05600482225418091, 0.12220868468284607, 0.18841242790222168, 0.25461629033088684, 0.320820152759552, 0.3870239853858948, 0.45322784781455994, 0.5194317102432251, 0.5856355428695679, 0.6518393754959106, 0.7180432677268982, 0.784247100353241, 0.8504509925842285, 0.9166548252105713, 0.9828586578369141, 1.0490624904632568, 1.1152663230895996, 1.181470274925232, 1.2476741075515747, 1.3138779401779175, 1.3800817728042603, 1.4462857246398926, 1.5124895572662354, 1.5786933898925781, 1.644897222518921, 1.7111010551452637, 1.7773048877716064, 1.8435087203979492, 1.909712553024292, 1.9759163856506348, 2.0421202182769775, 2.1083240509033203, 2.174528121948242, 2.240731954574585, 2.3069357872009277]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 8.0, 7.0, 11.0, 5.0, 16.0, 12.0, 15.0, 24.0, 19.0, 19.0, 36.0, 20.0, 42.0, 35.0, 46.0, 29.0, 52.0, 38.0, 42.0, 50.0, 51.0, 41.0, 40.0, 33.0, 43.0, 39.0, 23.0, 34.0, 29.0, 20.0, 21.0, 16.0, 9.0, 13.0, 8.0, 11.0, 10.0, 2.0, 8.0, 1.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-1.6376512050628662, -1.5897202491760254, -1.5417894124984741, -1.4938584566116333, -1.4459275007247925, -1.3979965448379517, -1.3500657081604004, -1.3021347522735596, -1.2542037963867188, -1.206272840499878, -1.1583420038223267, -1.1104110479354858, -1.062480092048645, -1.0145491361618042, -0.9666182994842529, -0.9186873435974121, -0.8707564473152161, -0.82282555103302, -0.7748945951461792, -0.7269636988639832, -0.6790327429771423, -0.6311018466949463, -0.5831708908081055, -0.5352399945259094, -0.487309068441391, -0.43937814235687256, -0.3914472162723541, -0.3435162901878357, -0.29558539390563965, -0.24765445291996002, -0.19972354173660278, -0.15179261565208435, -0.10386168956756592, -0.055930767208337784, -0.00799984484910965, 0.039931073784828186, 0.08786199986934662, 0.13579292595386505, 0.1837238371372223, 0.23165476322174072, 0.27958568930625916, 0.3275166153907776, 0.375447541475296, 0.42337846755981445, 0.4713093638420105, 0.5192403197288513, 0.5671712160110474, 0.6151021718978882, 0.6630330681800842, 0.7109639644622803, 0.7588949203491211, 0.8068258166313171, 0.854756772518158, 0.902687668800354, 0.9506186246871948, 0.9985495209693909, 1.046480417251587, 1.0944113731384277, 1.142342209815979, 1.1902731657028198, 1.2382041215896606, 1.2861350774765015, 1.3340659141540527, 1.3819968700408936, 1.4299278259277344]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 3.0, 6.0, 10.0, 16.0, 21.0, 40.0, 63.0, 72.0, 122.0, 256.0, 2084.0, 4187302.0, 3525.0, 393.0, 132.0, 79.0, 60.0, 32.0, 26.0, 11.0, 9.0, 7.0, 8.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.166015625, -3.086029052734375, -3.00604248046875, -2.926055908203125, -2.8460693359375, -2.766082763671875, -2.68609619140625, -2.606109619140625, -2.526123046875, -2.446136474609375, -2.36614990234375, -2.286163330078125, -2.2061767578125, -2.126190185546875, -2.04620361328125, -1.966217041015625, -1.88623046875, -1.806243896484375, -1.72625732421875, -1.646270751953125, -1.5662841796875, -1.486297607421875, -1.40631103515625, -1.326324462890625, -1.246337890625, -1.166351318359375, -1.08636474609375, -1.006378173828125, -0.9263916015625, -0.846405029296875, -0.76641845703125, -0.686431884765625, -0.6064453125, -0.526458740234375, -0.44647216796875, -0.366485595703125, -0.2864990234375, -0.206512451171875, -0.12652587890625, -0.046539306640625, 0.033447265625, 0.113433837890625, 0.19342041015625, 0.273406982421875, 0.3533935546875, 0.433380126953125, 0.51336669921875, 0.593353271484375, 0.67333984375, 0.753326416015625, 0.83331298828125, 0.913299560546875, 0.9932861328125, 1.073272705078125, 1.15325927734375, 1.233245849609375, 1.313232421875, 1.393218994140625, 1.47320556640625, 1.553192138671875, 1.6331787109375, 1.713165283203125, 1.79315185546875, 1.873138427734375, 1.953125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 9.0, 0.0, 5.0, 13.0, 6.0, 7.0, 17.0, 13.0, 18.0, 25.0, 21.0, 20.0, 45.0, 43.0, 37.0, 47.0, 50.0, 63.0, 70.0, 50.0, 56.0, 42.0, 56.0, 52.0, 49.0, 30.0, 24.0, 20.0, 32.0, 22.0, 8.0, 17.0, 17.0, 9.0, 4.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.10052490234375, -0.09747028350830078, -0.09441566467285156, -0.09136104583740234, -0.08830642700195312, -0.0852518081665039, -0.08219718933105469, -0.07914257049560547, -0.07608795166015625, -0.07303333282470703, -0.06997871398925781, -0.0669240951538086, -0.06386947631835938, -0.060814857482910156, -0.05776023864746094, -0.05470561981201172, -0.0516510009765625, -0.04859638214111328, -0.04554176330566406, -0.042487144470214844, -0.039432525634765625, -0.036377906799316406, -0.03332328796386719, -0.03026866912841797, -0.02721405029296875, -0.02415943145751953, -0.021104812622070312, -0.018050193786621094, -0.014995574951171875, -0.011940956115722656, -0.008886337280273438, -0.005831718444824219, -0.002777099609375, 0.00027751922607421875, 0.0033321380615234375, 0.006386756896972656, 0.009441375732421875, 0.012495994567871094, 0.015550613403320312, 0.01860523223876953, 0.02165985107421875, 0.02471446990966797, 0.027769088745117188, 0.030823707580566406, 0.033878326416015625, 0.036932945251464844, 0.03998756408691406, 0.04304218292236328, 0.0460968017578125, 0.04915142059326172, 0.05220603942871094, 0.055260658264160156, 0.058315277099609375, 0.061369895935058594, 0.06442451477050781, 0.06747913360595703, 0.07053375244140625, 0.07358837127685547, 0.07664299011230469, 0.0796976089477539, 0.08275222778320312, 0.08580684661865234, 0.08886146545410156, 0.09191608428955078, 0.094970703125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 1.0, 9.0, 11.0, 21.0, 16.0, 23.0, 27.0, 28.0, 38.0, 45.0, 74.0, 69.0, 95.0, 129.0, 207.0, 284.0, 476.0, 871.0, 2155.0, 13028.0, 4147548.0, 23583.0, 2840.0, 1012.0, 526.0, 307.0, 226.0, 162.0, 109.0, 90.0, 70.0, 41.0, 35.0, 31.0, 26.0, 12.0, 12.0, 9.0, 5.0, 12.0, 1.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.75732421875, -0.7317352294921875, -0.706146240234375, -0.6805572509765625, -0.65496826171875, -0.6293792724609375, -0.603790283203125, -0.5782012939453125, -0.5526123046875, -0.5270233154296875, -0.501434326171875, -0.4758453369140625, -0.45025634765625, -0.4246673583984375, -0.399078369140625, -0.3734893798828125, -0.347900390625, -0.3223114013671875, -0.296722412109375, -0.2711334228515625, -0.24554443359375, -0.2199554443359375, -0.194366455078125, -0.1687774658203125, -0.1431884765625, -0.1175994873046875, -0.092010498046875, -0.0664215087890625, -0.04083251953125, -0.0152435302734375, 0.010345458984375, 0.0359344482421875, 0.0615234375, 0.0871124267578125, 0.112701416015625, 0.1382904052734375, 0.16387939453125, 0.1894683837890625, 0.215057373046875, 0.2406463623046875, 0.2662353515625, 0.2918243408203125, 0.317413330078125, 0.3430023193359375, 0.36859130859375, 0.3941802978515625, 0.419769287109375, 0.4453582763671875, 0.470947265625, 0.4965362548828125, 0.522125244140625, 0.5477142333984375, 0.57330322265625, 0.5988922119140625, 0.624481201171875, 0.6500701904296875, 0.6756591796875, 0.7012481689453125, 0.726837158203125, 0.7524261474609375, 0.77801513671875, 0.8036041259765625, 0.829193115234375, 0.8547821044921875, 0.88037109375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 11.0, 20.0, 48.0, 245.0, 3561.0, 120.0, 27.0, 20.0, 9.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1390380859375, -0.1314678192138672, -0.12389755249023438, -0.11632728576660156, -0.10875701904296875, -0.10118675231933594, -0.09361648559570312, -0.08604621887207031, -0.0784759521484375, -0.07090568542480469, -0.06333541870117188, -0.05576515197753906, -0.04819488525390625, -0.04062461853027344, -0.033054351806640625, -0.025484085083007812, -0.017913818359375, -0.010343551635742188, -0.002773284912109375, 0.0047969818115234375, 0.01236724853515625, 0.019937515258789062, 0.027507781982421875, 0.03507804870605469, 0.0426483154296875, 0.05021858215332031, 0.057788848876953125, 0.06535911560058594, 0.07292938232421875, 0.08049964904785156, 0.08806991577148438, 0.09564018249511719, 0.10321044921875, 0.11078071594238281, 0.11835098266601562, 0.12592124938964844, 0.13349151611328125, 0.14106178283691406, 0.14863204956054688, 0.1562023162841797, 0.1637725830078125, 0.1713428497314453, 0.17891311645507812, 0.18648338317871094, 0.19405364990234375, 0.20162391662597656, 0.20919418334960938, 0.2167644500732422, 0.224334716796875, 0.2319049835205078, 0.23947525024414062, 0.24704551696777344, 0.25461578369140625, 0.26218605041503906, 0.2697563171386719, 0.2773265838623047, 0.2848968505859375, 0.2924671173095703, 0.3000373840332031, 0.30760765075683594, 0.31517791748046875, 0.32274818420410156, 0.3303184509277344, 0.3378887176513672, 0.345458984375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 11.0, 16.0, 27.0, 75.0, 102.0, 153.0, 236.0, 160.0, 92.0, 74.0, 22.0, 11.0, 12.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.550527811050415, -1.5156991481781006, -1.4808706045150757, -1.4460419416427612, -1.4112132787704468, -1.3763846158981323, -1.3415560722351074, -1.306727409362793, -1.2718987464904785, -1.237070083618164, -1.2022415399551392, -1.1674128770828247, -1.1325842142105103, -1.0977555513381958, -1.062927007675171, -1.0280983448028564, -0.9932697415351868, -0.9584411382675171, -0.9236124753952026, -0.888783872127533, -0.8539552092552185, -0.8191266059875488, -0.7842979431152344, -0.7494693398475647, -0.714640736579895, -0.6798121333122253, -0.6449834704399109, -0.6101548671722412, -0.5753262042999268, -0.5404976010322571, -0.5056689977645874, -0.47084033489227295, -0.43601173162460327, -0.4011830985546112, -0.36635446548461914, -0.33152586221694946, -0.296697199344635, -0.26186859607696533, -0.22703996300697327, -0.1922113299369812, -0.15738269686698914, -0.12255406379699707, -0.0877254381775856, -0.05289681255817413, -0.018068179488182068, 0.016760453581809998, 0.05158907175064087, 0.08641770482063293, 0.121246337890625, 0.15607497096061707, 0.19090360403060913, 0.22573222219944, 0.26056087017059326, 0.29538947343826294, 0.330218106508255, 0.36504673957824707, 0.39987537264823914, 0.4347040057182312, 0.46953263878822327, 0.5043612718582153, 0.539189875125885, 0.5740185379981995, 0.6088471412658691, 0.6436758041381836, 0.6785044074058533]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 8.0, 7.0, 8.0, 8.0, 16.0, 22.0, 31.0, 38.0, 49.0, 51.0, 54.0, 74.0, 74.0, 86.0, 64.0, 73.0, 69.0, 70.0, 49.0, 46.0, 28.0, 23.0, 14.0, 14.0, 10.0, 8.0, 2.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5241246819496155, -0.5081518292427063, -0.49217894673347473, -0.47620606422424316, -0.4602331817150116, -0.44426029920578003, -0.42828744649887085, -0.4123145639896393, -0.3963416814804077, -0.38036879897117615, -0.36439594626426697, -0.3484230637550354, -0.33245018124580383, -0.31647729873657227, -0.3005044460296631, -0.2845315635204315, -0.26855871081352234, -0.25258582830429077, -0.2366129606962204, -0.22064009308815002, -0.20466721057891846, -0.18869434297084808, -0.1727214753627777, -0.15674859285354614, -0.14077572524547577, -0.1248028501868248, -0.10882997512817383, -0.09285710752010345, -0.07688423246145248, -0.060911357402801514, -0.04493848979473114, -0.02896561473608017, -0.0129927396774292, 0.002980133518576622, 0.018953006714582443, 0.034925878047943115, 0.050898753106594086, 0.06687162816524506, 0.08284449577331543, 0.0988173708319664, 0.11479024589061737, 0.13076311349868774, 0.1467359960079193, 0.16270886361598969, 0.17868173122406006, 0.19465461373329163, 0.210627481341362, 0.22660034894943237, 0.24257323145866394, 0.2585461139678955, 0.2745189666748047, 0.29049184918403625, 0.3064647316932678, 0.322437584400177, 0.33841046690940857, 0.35438334941864014, 0.3703562021255493, 0.3863290846347809, 0.40230193734169006, 0.41827481985092163, 0.4342477023601532, 0.45022058486938477, 0.46619343757629395, 0.4821663200855255, 0.4981392025947571]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 1.0, 2.0, 4.0, 8.0, 5.0, 13.0, 26.0, 35.0, 56.0, 69.0, 103.0, 168.0, 274.0, 478.0, 963.0, 2003.0, 4051.0, 9154.0, 22516.0, 61470.0, 184951.0, 395256.0, 237882.0, 79263.0, 28677.0, 11311.0, 4860.0, 2288.0, 1168.0, 585.0, 364.0, 198.0, 118.0, 73.0, 42.0, 33.0, 28.0, 14.0, 14.0, 10.0, 8.0, 4.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.2083740234375, -0.20252418518066406, -0.19667434692382812, -0.1908245086669922, -0.18497467041015625, -0.1791248321533203, -0.17327499389648438, -0.16742515563964844, -0.1615753173828125, -0.15572547912597656, -0.14987564086914062, -0.1440258026123047, -0.13817596435546875, -0.1323261260986328, -0.12647628784179688, -0.12062644958496094, -0.114776611328125, -0.10892677307128906, -0.10307693481445312, -0.09722709655761719, -0.09137725830078125, -0.08552742004394531, -0.07967758178710938, -0.07382774353027344, -0.0679779052734375, -0.06212806701660156, -0.056278228759765625, -0.05042839050292969, -0.04457855224609375, -0.03872871398925781, -0.032878875732421875, -0.027029037475585938, -0.02117919921875, -0.015329360961914062, -0.009479522705078125, -0.0036296844482421875, 0.00222015380859375, 0.008069992065429688, 0.013919830322265625, 0.019769668579101562, 0.0256195068359375, 0.03146934509277344, 0.037319183349609375, 0.04316902160644531, 0.04901885986328125, 0.05486869812011719, 0.060718536376953125, 0.06656837463378906, 0.072418212890625, 0.07826805114746094, 0.08411788940429688, 0.08996772766113281, 0.09581756591796875, 0.10166740417480469, 0.10751724243164062, 0.11336708068847656, 0.1192169189453125, 0.12506675720214844, 0.13091659545898438, 0.1367664337158203, 0.14261627197265625, 0.1484661102294922, 0.15431594848632812, 0.16016578674316406, 0.166015625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 2.0, 8.0, 12.0, 12.0, 21.0, 7.0, 18.0, 16.0, 24.0, 41.0, 35.0, 37.0, 42.0, 54.0, 48.0, 51.0, 47.0, 64.0, 48.0, 49.0, 52.0, 46.0, 41.0, 26.0, 31.0, 35.0, 31.0, 17.0, 21.0, 15.0, 11.0, 7.0, 9.0, 6.0, 1.0, 3.0, 5.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.10357666015625, -0.10044479370117188, -0.09731292724609375, -0.09418106079101562, -0.0910491943359375, -0.08791732788085938, -0.08478546142578125, -0.08165359497070312, -0.078521728515625, -0.07538986206054688, -0.07225799560546875, -0.06912612915039062, -0.0659942626953125, -0.06286239624023438, -0.05973052978515625, -0.056598663330078125, -0.053466796875, -0.050334930419921875, -0.04720306396484375, -0.044071197509765625, -0.0409393310546875, -0.037807464599609375, -0.03467559814453125, -0.031543731689453125, -0.028411865234375, -0.025279998779296875, -0.02214813232421875, -0.019016265869140625, -0.0158843994140625, -0.012752532958984375, -0.00962066650390625, -0.006488800048828125, -0.00335693359375, -0.000225067138671875, 0.00290679931640625, 0.006038665771484375, 0.0091705322265625, 0.012302398681640625, 0.01543426513671875, 0.018566131591796875, 0.021697998046875, 0.024829864501953125, 0.02796173095703125, 0.031093597412109375, 0.0342254638671875, 0.037357330322265625, 0.04048919677734375, 0.043621063232421875, 0.0467529296875, 0.049884796142578125, 0.05301666259765625, 0.056148529052734375, 0.0592803955078125, 0.062412261962890625, 0.06554412841796875, 0.06867599487304688, 0.071807861328125, 0.07493972778320312, 0.07807159423828125, 0.08120346069335938, 0.0843353271484375, 0.08746719360351562, 0.09059906005859375, 0.09373092651367188, 0.09686279296875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 1.0, 2.0, 4.0, 6.0, 11.0, 12.0, 28.0, 44.0, 94.0, 107.0, 194.0, 316.0, 644.0, 2113.0, 19508.0, 891560.0, 126942.0, 4766.0, 1123.0, 453.0, 242.0, 151.0, 74.0, 49.0, 34.0, 27.0, 17.0, 8.0, 5.0, 8.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73095703125, -0.70928955078125, -0.6876220703125, -0.66595458984375, -0.644287109375, -0.62261962890625, -0.6009521484375, -0.57928466796875, -0.5576171875, -0.53594970703125, -0.5142822265625, -0.49261474609375, -0.470947265625, -0.44927978515625, -0.4276123046875, -0.40594482421875, -0.38427734375, -0.36260986328125, -0.3409423828125, -0.31927490234375, -0.297607421875, -0.27593994140625, -0.2542724609375, -0.23260498046875, -0.2109375, -0.18927001953125, -0.1676025390625, -0.14593505859375, -0.124267578125, -0.10260009765625, -0.0809326171875, -0.05926513671875, -0.03759765625, -0.01593017578125, 0.0057373046875, 0.02740478515625, 0.049072265625, 0.07073974609375, 0.0924072265625, 0.11407470703125, 0.1357421875, 0.15740966796875, 0.1790771484375, 0.20074462890625, 0.222412109375, 0.24407958984375, 0.2657470703125, 0.28741455078125, 0.30908203125, 0.33074951171875, 0.3524169921875, 0.37408447265625, 0.395751953125, 0.41741943359375, 0.4390869140625, 0.46075439453125, 0.482421875, 0.50408935546875, 0.5257568359375, 0.54742431640625, 0.569091796875, 0.59075927734375, 0.6124267578125, 0.63409423828125, 0.65576171875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 16.0, 16.0, 21.0, 29.0, 28.0, 40.0, 48.0, 65.0, 66.0, 74.0, 67.0, 83.0, 72.0, 77.0, 66.0, 53.0, 44.0, 41.0, 20.0, 19.0, 14.0, 10.0, 5.0, 10.0, 11.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.427490234375, -0.4106407165527344, -0.39379119873046875, -0.3769416809082031, -0.3600921630859375, -0.3432426452636719, -0.32639312744140625, -0.3095436096191406, -0.292694091796875, -0.2758445739746094, -0.25899505615234375, -0.24214553833007812, -0.2252960205078125, -0.20844650268554688, -0.19159698486328125, -0.17474746704101562, -0.15789794921875, -0.14104843139648438, -0.12419891357421875, -0.10734939575195312, -0.0904998779296875, -0.07365036010742188, -0.05680084228515625, -0.039951324462890625, -0.023101806640625, -0.006252288818359375, 0.01059722900390625, 0.027446746826171875, 0.0442962646484375, 0.061145782470703125, 0.07799530029296875, 0.09484481811523438, 0.1116943359375, 0.12854385375976562, 0.14539337158203125, 0.16224288940429688, 0.1790924072265625, 0.19594192504882812, 0.21279144287109375, 0.22964096069335938, 0.246490478515625, 0.2633399963378906, 0.28018951416015625, 0.2970390319824219, 0.3138885498046875, 0.3307380676269531, 0.34758758544921875, 0.3644371032714844, 0.38128662109375, 0.3981361389160156, 0.41498565673828125, 0.4318351745605469, 0.4486846923828125, 0.4655342102050781, 0.48238372802734375, 0.4992332458496094, 0.516082763671875, 0.5329322814941406, 0.5497817993164062, 0.5666313171386719, 0.5834808349609375, 0.6003303527832031, 0.6171798706054688, 0.6340293884277344, 0.65087890625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 13.0, 22.0, 10.0, 34.0, 68.0, 104.0, 256.0, 619.0, 1839.0, 9058.0, 100465.0, 854285.0, 71898.0, 7202.0, 1641.0, 548.0, 231.0, 97.0, 61.0, 35.0, 15.0, 15.0, 7.0, 8.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.139892578125, -0.1357097625732422, -0.13152694702148438, -0.12734413146972656, -0.12316131591796875, -0.11897850036621094, -0.11479568481445312, -0.11061286926269531, -0.1064300537109375, -0.10224723815917969, -0.09806442260742188, -0.09388160705566406, -0.08969879150390625, -0.08551597595214844, -0.08133316040039062, -0.07715034484863281, -0.072967529296875, -0.06878471374511719, -0.06460189819335938, -0.06041908264160156, -0.05623626708984375, -0.05205345153808594, -0.047870635986328125, -0.04368782043457031, -0.0395050048828125, -0.03532218933105469, -0.031139373779296875, -0.026956558227539062, -0.02277374267578125, -0.018590927124023438, -0.014408111572265625, -0.010225296020507812, -0.00604248046875, -0.0018596649169921875, 0.002323150634765625, 0.0065059661865234375, 0.01068878173828125, 0.014871597290039062, 0.019054412841796875, 0.023237228393554688, 0.0274200439453125, 0.03160285949707031, 0.035785675048828125, 0.03996849060058594, 0.04415130615234375, 0.04833412170410156, 0.052516937255859375, 0.05669975280761719, 0.060882568359375, 0.06506538391113281, 0.06924819946289062, 0.07343101501464844, 0.07761383056640625, 0.08179664611816406, 0.08597946166992188, 0.09016227722167969, 0.0943450927734375, 0.09852790832519531, 0.10271072387695312, 0.10689353942871094, 0.11107635498046875, 0.11525917053222656, 0.11944198608398438, 0.12362480163574219, 0.1278076171875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 8.0, 10.0, 6.0, 11.0, 13.0, 35.0, 42.0, 40.0, 79.0, 111.0, 130.0, 135.0, 99.0, 81.0, 65.0, 32.0, 26.0, 18.0, 13.0, 12.0, 10.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3543834686279297e-05, -2.2730790078639984e-05, -2.191774547100067e-05, -2.110470086336136e-05, -2.0291656255722046e-05, -1.9478611648082733e-05, -1.866556704044342e-05, -1.7852522432804108e-05, -1.7039477825164795e-05, -1.6226433217525482e-05, -1.541338860988617e-05, -1.4600344002246857e-05, -1.3787299394607544e-05, -1.2974254786968231e-05, -1.2161210179328918e-05, -1.1348165571689606e-05, -1.0535120964050293e-05, -9.72207635641098e-06, -8.909031748771667e-06, -8.095987141132355e-06, -7.282942533493042e-06, -6.469897925853729e-06, -5.6568533182144165e-06, -4.843808710575104e-06, -4.030764102935791e-06, -3.2177194952964783e-06, -2.4046748876571655e-06, -1.5916302800178528e-06, -7.7858567237854e-07, 3.4458935260772705e-08, 8.475035429000854e-07, 1.6605481505393982e-06, 2.473592758178711e-06, 3.2866373658180237e-06, 4.0996819734573364e-06, 4.912726581096649e-06, 5.725771188735962e-06, 6.538815796375275e-06, 7.351860404014587e-06, 8.1649050116539e-06, 8.977949619293213e-06, 9.790994226932526e-06, 1.0604038834571838e-05, 1.1417083442211151e-05, 1.2230128049850464e-05, 1.3043172657489777e-05, 1.385621726512909e-05, 1.4669261872768402e-05, 1.5482306480407715e-05, 1.6295351088047028e-05, 1.710839569568634e-05, 1.7921440303325653e-05, 1.8734484910964966e-05, 1.954752951860428e-05, 2.036057412624359e-05, 2.1173618733882904e-05, 2.1986663341522217e-05, 2.279970794916153e-05, 2.3612752556800842e-05, 2.4425797164440155e-05, 2.5238841772079468e-05, 2.605188637971878e-05, 2.6864930987358093e-05, 2.7677975594997406e-05, 2.849102020263672e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 3.0, 4.0, 5.0, 4.0, 10.0, 17.0, 29.0, 58.0, 97.0, 182.0, 429.0, 994.0, 3313.0, 18386.0, 311122.0, 674875.0, 32131.0, 4632.0, 1306.0, 486.0, 215.0, 104.0, 63.0, 32.0, 20.0, 19.0, 6.0, 6.0, 4.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1221923828125, -0.11732864379882812, -0.11246490478515625, -0.10760116577148438, -0.1027374267578125, -0.09787368774414062, -0.09300994873046875, -0.08814620971679688, -0.083282470703125, -0.07841873168945312, -0.07355499267578125, -0.06869125366210938, -0.0638275146484375, -0.058963775634765625, -0.05410003662109375, -0.049236297607421875, -0.04437255859375, -0.039508819580078125, -0.03464508056640625, -0.029781341552734375, -0.0249176025390625, -0.020053863525390625, -0.01519012451171875, -0.010326385498046875, -0.005462646484375, -0.000598907470703125, 0.00426483154296875, 0.009128570556640625, 0.0139923095703125, 0.018856048583984375, 0.02371978759765625, 0.028583526611328125, 0.033447265625, 0.038311004638671875, 0.04317474365234375, 0.048038482666015625, 0.0529022216796875, 0.057765960693359375, 0.06262969970703125, 0.06749343872070312, 0.072357177734375, 0.07722091674804688, 0.08208465576171875, 0.08694839477539062, 0.0918121337890625, 0.09667587280273438, 0.10153961181640625, 0.10640335083007812, 0.11126708984375, 0.11613082885742188, 0.12099456787109375, 0.12585830688476562, 0.1307220458984375, 0.13558578491210938, 0.14044952392578125, 0.14531326293945312, 0.150177001953125, 0.15504074096679688, 0.15990447998046875, 0.16476821899414062, 0.1696319580078125, 0.17449569702148438, 0.17935943603515625, 0.18422317504882812, 0.1890869140625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 6.0, 7.0, 13.0, 15.0, 19.0, 24.0, 41.0, 45.0, 69.0, 90.0, 104.0, 114.0, 116.0, 87.0, 87.0, 41.0, 43.0, 25.0, 8.0, 15.0, 8.0, 7.0, 3.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10205078125, -0.09820938110351562, -0.09436798095703125, -0.09052658081054688, -0.0866851806640625, -0.08284378051757812, -0.07900238037109375, -0.07516098022460938, -0.071319580078125, -0.06747817993164062, -0.06363677978515625, -0.059795379638671875, -0.0559539794921875, -0.052112579345703125, -0.04827117919921875, -0.044429779052734375, -0.04058837890625, -0.036746978759765625, -0.03290557861328125, -0.029064178466796875, -0.0252227783203125, -0.021381378173828125, -0.01753997802734375, -0.013698577880859375, -0.009857177734375, -0.006015777587890625, -0.00217437744140625, 0.001667022705078125, 0.0055084228515625, 0.009349822998046875, 0.01319122314453125, 0.017032623291015625, 0.0208740234375, 0.024715423583984375, 0.02855682373046875, 0.032398223876953125, 0.0362396240234375, 0.040081024169921875, 0.04392242431640625, 0.047763824462890625, 0.051605224609375, 0.055446624755859375, 0.05928802490234375, 0.06312942504882812, 0.0669708251953125, 0.07081222534179688, 0.07465362548828125, 0.07849502563476562, 0.08233642578125, 0.08617782592773438, 0.09001922607421875, 0.09386062622070312, 0.0977020263671875, 0.10154342651367188, 0.10538482666015625, 0.10922622680664062, 0.113067626953125, 0.11690902709960938, 0.12075042724609375, 0.12459182739257812, 0.1284332275390625, 0.13227462768554688, 0.13611602783203125, 0.13995742797851562, 0.143798828125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 13.0, 24.0, 110.0, 288.0, 358.0, 142.0, 49.0, 15.0, 10.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.113621711730957, -8.91662311553955, -8.719624519348145, -8.522625923156738, -8.325627326965332, -8.128628730773926, -7.931630611419678, -7.7346320152282715, -7.537633419036865, -7.340634822845459, -7.143636226654053, -6.9466376304626465, -6.749639511108398, -6.552640914916992, -6.355642318725586, -6.15864372253418, -5.961645126342773, -5.764646530151367, -5.567647933959961, -5.370649337768555, -5.173650741577148, -4.9766526222229, -4.779654026031494, -4.582655429840088, -4.385656833648682, -4.188658237457275, -3.991659641265869, -3.794661283493042, -3.5976626873016357, -3.4006640911102295, -3.2036657333374023, -3.006667137145996, -2.809669017791748, -2.612670421600342, -2.4156718254089355, -2.2186734676361084, -2.021674871444702, -1.824676275253296, -1.6276777982711792, -1.4306793212890625, -1.2336807250976562, -1.03668212890625, -0.8396836519241333, -0.6426851153373718, -0.44568657875061035, -0.24868804216384888, -0.0516895055770874, 0.1453089714050293, 0.34230756759643555, 0.539306104183197, 0.7363046407699585, 0.93330317735672, 1.1303017139434814, 1.3273003101348877, 1.5242987871170044, 1.721297264099121, 1.9182958602905273, 2.1152944564819336, 2.31229305267334, 2.509291410446167, 2.7062900066375732, 2.9032886028289795, 3.1002869606018066, 3.297285556793213, 3.494284152984619]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 6.0, 2.0, 3.0, 11.0, 9.0, 6.0, 13.0, 19.0, 16.0, 22.0, 12.0, 20.0, 21.0, 19.0, 33.0, 36.0, 35.0, 41.0, 37.0, 43.0, 44.0, 61.0, 52.0, 51.0, 39.0, 43.0, 35.0, 31.0, 25.0, 29.0, 23.0, 38.0, 24.0, 26.0, 17.0, 14.0, 13.0, 2.0, 7.0, 7.0, 2.0, 3.0, 1.0, 4.0, 4.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5337650775909424, -1.4867222309112549, -1.4396793842315674, -1.3926365375518799, -1.3455935716629028, -1.2985507249832153, -1.2515078783035278, -1.2044650316238403, -1.1574220657348633, -1.1103792190551758, -1.0633363723754883, -1.0162935256958008, -0.9692505598068237, -0.9222077131271362, -0.8751648664474487, -0.8281220197677612, -0.7810791730880737, -0.7340363264083862, -0.686993420124054, -0.6399505734443665, -0.5929076671600342, -0.5458648204803467, -0.4988219738006592, -0.4517790973186493, -0.4047362208366394, -0.3576933443546295, -0.31065046787261963, -0.26360762119293213, -0.21656474471092224, -0.16952186822891235, -0.12247902154922485, -0.07543614506721497, -0.028393149375915527, 0.018649719655513763, 0.06569258868694305, 0.11273545026779175, 0.15977832674980164, 0.20682120323181152, 0.253864049911499, 0.3009069263935089, 0.3479498028755188, 0.3949926793575287, 0.4420355558395386, 0.4890784025192261, 0.5361212491989136, 0.5831641554832458, 0.6302070021629333, 0.6772499084472656, 0.7242927551269531, 0.7713356018066406, 0.8183785080909729, 0.8654213547706604, 0.9124642610549927, 0.9595071077346802, 1.0065499544143677, 1.0535928010940552, 1.1006357669830322, 1.1476786136627197, 1.1947214603424072, 1.2417643070220947, 1.2888072729110718, 1.3358501195907593, 1.3828929662704468, 1.4299358129501343, 1.4769786596298218]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 5.0, 3.0, 3.0, 4.0, 4.0, 10.0, 14.0, 21.0, 28.0, 30.0, 71.0, 93.0, 182.0, 323.0, 691.0, 1757.0, 6613.0, 51909.0, 3965164.0, 151552.0, 11470.0, 2624.0, 881.0, 387.0, 207.0, 92.0, 50.0, 31.0, 27.0, 10.0, 10.0, 4.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5966796875, -0.5816307067871094, -0.5665817260742188, -0.5515327453613281, -0.5364837646484375, -0.5214347839355469, -0.5063858032226562, -0.4913368225097656, -0.476287841796875, -0.4612388610839844, -0.44618988037109375, -0.4311408996582031, -0.4160919189453125, -0.4010429382324219, -0.38599395751953125, -0.3709449768066406, -0.35589599609375, -0.3408470153808594, -0.32579803466796875, -0.3107490539550781, -0.2957000732421875, -0.2806510925292969, -0.26560211181640625, -0.2505531311035156, -0.235504150390625, -0.22045516967773438, -0.20540618896484375, -0.19035720825195312, -0.1753082275390625, -0.16025924682617188, -0.14521026611328125, -0.13016128540039062, -0.1151123046875, -0.10006332397460938, -0.08501434326171875, -0.06996536254882812, -0.0549163818359375, -0.039867401123046875, -0.02481842041015625, -0.009769439697265625, 0.005279541015625, 0.020328521728515625, 0.03537750244140625, 0.050426483154296875, 0.0654754638671875, 0.08052444458007812, 0.09557342529296875, 0.11062240600585938, 0.12567138671875, 0.14072036743164062, 0.15576934814453125, 0.17081832885742188, 0.1858673095703125, 0.20091629028320312, 0.21596527099609375, 0.23101425170898438, 0.246063232421875, 0.2611122131347656, 0.27616119384765625, 0.2912101745605469, 0.3062591552734375, 0.3213081359863281, 0.33635711669921875, 0.3514060974121094, 0.366455078125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 2.0, 6.0, 10.0, 13.0, 17.0, 20.0, 27.0, 25.0, 35.0, 45.0, 53.0, 64.0, 60.0, 47.0, 62.0, 63.0, 57.0, 65.0, 66.0, 41.0, 46.0, 35.0, 28.0, 29.0, 19.0, 16.0, 13.0, 11.0, 6.0, 11.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09234619140625, -0.08892536163330078, -0.08550453186035156, -0.08208370208740234, -0.07866287231445312, -0.0752420425415039, -0.07182121276855469, -0.06840038299560547, -0.06497955322265625, -0.06155872344970703, -0.05813789367675781, -0.054717063903808594, -0.051296234130859375, -0.047875404357910156, -0.04445457458496094, -0.04103374481201172, -0.0376129150390625, -0.03419208526611328, -0.030771255493164062, -0.027350425720214844, -0.023929595947265625, -0.020508766174316406, -0.017087936401367188, -0.013667106628417969, -0.01024627685546875, -0.006825447082519531, -0.0034046173095703125, 1.621246337890625e-05, 0.003437042236328125, 0.006857872009277344, 0.010278701782226562, 0.013699531555175781, 0.017120361328125, 0.02054119110107422, 0.023962020874023438, 0.027382850646972656, 0.030803680419921875, 0.034224510192871094, 0.03764533996582031, 0.04106616973876953, 0.04448699951171875, 0.04790782928466797, 0.05132865905761719, 0.054749488830566406, 0.058170318603515625, 0.061591148376464844, 0.06501197814941406, 0.06843280792236328, 0.0718536376953125, 0.07527446746826172, 0.07869529724121094, 0.08211612701416016, 0.08553695678710938, 0.0889577865600586, 0.09237861633300781, 0.09579944610595703, 0.09922027587890625, 0.10264110565185547, 0.10606193542480469, 0.1094827651977539, 0.11290359497070312, 0.11632442474365234, 0.11974525451660156, 0.12316608428955078, 0.1265869140625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 3.0, 7.0, 5.0, 9.0, 6.0, 9.0, 18.0, 20.0, 33.0, 25.0, 60.0, 98.0, 205.0, 485.0, 1195.0, 3834.0, 14640.0, 89405.0, 3817153.0, 233224.0, 24807.0, 5936.0, 1857.0, 614.0, 286.0, 130.0, 80.0, 33.0, 19.0, 7.0, 13.0, 15.0, 10.0, 13.0, 7.0, 4.0, 2.0, 4.0, 0.0, 5.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.304931640625, -0.2942924499511719, -0.28365325927734375, -0.2730140686035156, -0.2623748779296875, -0.2517356872558594, -0.24109649658203125, -0.23045730590820312, -0.219818115234375, -0.20917892456054688, -0.19853973388671875, -0.18790054321289062, -0.1772613525390625, -0.16662216186523438, -0.15598297119140625, -0.14534378051757812, -0.13470458984375, -0.12406539916992188, -0.11342620849609375, -0.10278701782226562, -0.0921478271484375, -0.08150863647460938, -0.07086944580078125, -0.060230255126953125, -0.049591064453125, -0.038951873779296875, -0.02831268310546875, -0.017673492431640625, -0.0070343017578125, 0.003604888916015625, 0.01424407958984375, 0.024883270263671875, 0.0355224609375, 0.046161651611328125, 0.05680084228515625, 0.06744003295898438, 0.0780792236328125, 0.08871841430664062, 0.09935760498046875, 0.10999679565429688, 0.120635986328125, 0.13127517700195312, 0.14191436767578125, 0.15255355834960938, 0.1631927490234375, 0.17383193969726562, 0.18447113037109375, 0.19511032104492188, 0.20574951171875, 0.21638870239257812, 0.22702789306640625, 0.23766708374023438, 0.2483062744140625, 0.2589454650878906, 0.26958465576171875, 0.2802238464355469, 0.290863037109375, 0.3015022277832031, 0.31214141845703125, 0.3227806091308594, 0.3334197998046875, 0.3440589904785156, 0.35469818115234375, 0.3653373718261719, 0.3759765625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 6.0, 1.0, 6.0, 10.0, 5.0, 20.0, 16.0, 29.0, 25.0, 57.0, 68.0, 194.0, 371.0, 1065.0, 1214.0, 498.0, 204.0, 92.0, 54.0, 23.0, 21.0, 14.0, 8.0, 18.0, 11.0, 8.0, 9.0, 4.0, 6.0, 3.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2252197265625, -0.21773719787597656, -0.21025466918945312, -0.2027721405029297, -0.19528961181640625, -0.1878070831298828, -0.18032455444335938, -0.17284202575683594, -0.1653594970703125, -0.15787696838378906, -0.15039443969726562, -0.1429119110107422, -0.13542938232421875, -0.1279468536376953, -0.12046432495117188, -0.11298179626464844, -0.105499267578125, -0.09801673889160156, -0.09053421020507812, -0.08305168151855469, -0.07556915283203125, -0.06808662414550781, -0.060604095458984375, -0.05312156677246094, -0.0456390380859375, -0.03815650939941406, -0.030673980712890625, -0.023191452026367188, -0.01570892333984375, -0.008226394653320312, -0.000743865966796875, 0.0067386627197265625, 0.01422119140625, 0.021703720092773438, 0.029186248779296875, 0.03666877746582031, 0.04415130615234375, 0.05163383483886719, 0.059116363525390625, 0.06659889221191406, 0.0740814208984375, 0.08156394958496094, 0.08904647827148438, 0.09652900695800781, 0.10401153564453125, 0.11149406433105469, 0.11897659301757812, 0.12645912170410156, 0.133941650390625, 0.14142417907714844, 0.14890670776367188, 0.1563892364501953, 0.16387176513671875, 0.1713542938232422, 0.17883682250976562, 0.18631935119628906, 0.1938018798828125, 0.20128440856933594, 0.20876693725585938, 0.2162494659423828, 0.22373199462890625, 0.2312145233154297, 0.23869705200195312, 0.24617958068847656, 0.253662109375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 7.0, 5.0, 9.0, 5.0, 11.0, 19.0, 41.0, 99.0, 125.0, 205.0, 170.0, 148.0, 68.0, 47.0, 20.0, 7.0, 9.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.754014015197754, -2.6829781532287598, -2.6119425296783447, -2.5409066677093506, -2.4698708057403564, -2.3988351821899414, -2.3277993202209473, -2.256763458251953, -2.185727596282959, -2.114691734313965, -2.04365611076355, -1.9726202487945557, -1.9015843868255615, -1.830548644065857, -1.7595129013061523, -1.6884770393371582, -1.6174414157867432, -1.5464056730270386, -1.4753698110580444, -1.4043340682983398, -1.3332982063293457, -1.2622624635696411, -1.1912267208099365, -1.1201908588409424, -1.0491551160812378, -0.9781193137168884, -0.9070835113525391, -0.8360477685928345, -0.7650119662284851, -0.6939761638641357, -0.6229404211044312, -0.5519046187400818, -0.4808688163757324, -0.40983301401138306, -0.3387972414493561, -0.2677614688873291, -0.19672566652297974, -0.12568986415863037, -0.054654091596603394, 0.016381680965423584, 0.08741748332977295, 0.15845327079296112, 0.2294890582561493, 0.30052483081817627, 0.37156063318252563, 0.442596435546875, 0.5136321783065796, 0.584667980670929, 0.6557037830352783, 0.7267395853996277, 0.797775387763977, 0.8688111305236816, 0.939846932888031, 1.0108827352523804, 1.081918478012085, 1.152954339981079, 1.2239900827407837, 1.2950258255004883, 1.3660616874694824, 1.437097430229187, 1.5081331729888916, 1.5791690349578857, 1.6502047777175903, 1.721240520477295, 1.792276382446289]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 9.0, 8.0, 8.0, 15.0, 10.0, 26.0, 24.0, 18.0, 41.0, 49.0, 50.0, 44.0, 51.0, 50.0, 58.0, 72.0, 53.0, 43.0, 48.0, 45.0, 41.0, 32.0, 35.0, 26.0, 20.0, 24.0, 30.0, 15.0, 13.0, 17.0, 9.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0023683309555054, -0.9696778059005737, -0.9369872808456421, -0.9042967557907104, -0.8716062307357788, -0.8389157056808472, -0.8062251806259155, -0.7735346555709839, -0.7408441305160522, -0.7081536054611206, -0.675463080406189, -0.6427725553512573, -0.6100820302963257, -0.577391505241394, -0.5447009801864624, -0.5120104551315308, -0.4793199300765991, -0.4466294050216675, -0.41393887996673584, -0.3812483549118042, -0.34855782985687256, -0.3158673048019409, -0.2831767797470093, -0.25048625469207764, -0.217795729637146, -0.18510520458221436, -0.15241467952728271, -0.11972415447235107, -0.08703362941741943, -0.05434310436248779, -0.021652579307556152, 0.011037945747375488, 0.04372835159301758, 0.07641887664794922, 0.10910940170288086, 0.1417999267578125, 0.17449045181274414, 0.20718097686767578, 0.23987150192260742, 0.27256202697753906, 0.3052525520324707, 0.33794307708740234, 0.370633602142334, 0.4033241271972656, 0.43601465225219727, 0.4687051773071289, 0.5013957023620605, 0.5340862274169922, 0.5667767524719238, 0.5994672775268555, 0.6321578025817871, 0.6648483276367188, 0.6975388526916504, 0.730229377746582, 0.7629199028015137, 0.7956104278564453, 0.828300952911377, 0.8609914779663086, 0.8936820030212402, 0.9263725280761719, 0.9590630531311035, 0.9917535781860352, 1.0244441032409668, 1.0571346282958984, 1.08982515335083]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 7.0, 22.0, 15.0, 21.0, 37.0, 52.0, 96.0, 114.0, 187.0, 294.0, 547.0, 1030.0, 2209.0, 5245.0, 13431.0, 38528.0, 117090.0, 309253.0, 344345.0, 141748.0, 46552.0, 16332.0, 6109.0, 2559.0, 1204.0, 605.0, 308.0, 186.0, 127.0, 85.0, 54.0, 31.0, 25.0, 26.0, 15.0, 11.0, 12.0, 6.0, 7.0, 4.0, 7.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.1982421875, -0.1924266815185547, -0.18661117553710938, -0.18079566955566406, -0.17498016357421875, -0.16916465759277344, -0.16334915161132812, -0.1575336456298828, -0.1517181396484375, -0.1459026336669922, -0.14008712768554688, -0.13427162170410156, -0.12845611572265625, -0.12264060974121094, -0.11682510375976562, -0.11100959777832031, -0.105194091796875, -0.09937858581542969, -0.09356307983398438, -0.08774757385253906, -0.08193206787109375, -0.07611656188964844, -0.07030105590820312, -0.06448554992675781, -0.0586700439453125, -0.05285453796386719, -0.047039031982421875, -0.04122352600097656, -0.03540802001953125, -0.029592514038085938, -0.023777008056640625, -0.017961502075195312, -0.01214599609375, -0.0063304901123046875, -0.000514984130859375, 0.0053005218505859375, 0.01111602783203125, 0.016931533813476562, 0.022747039794921875, 0.028562545776367188, 0.0343780517578125, 0.04019355773925781, 0.046009063720703125, 0.05182456970214844, 0.05764007568359375, 0.06345558166503906, 0.06927108764648438, 0.07508659362792969, 0.080902099609375, 0.08671760559082031, 0.09253311157226562, 0.09834861755371094, 0.10416412353515625, 0.10997962951660156, 0.11579513549804688, 0.12161064147949219, 0.1274261474609375, 0.1332416534423828, 0.13905715942382812, 0.14487266540527344, 0.15068817138671875, 0.15650367736816406, 0.16231918334960938, 0.1681346893310547, 0.1739501953125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 6.0, 8.0, 13.0, 10.0, 18.0, 20.0, 21.0, 21.0, 30.0, 35.0, 46.0, 43.0, 58.0, 57.0, 51.0, 40.0, 54.0, 52.0, 48.0, 55.0, 42.0, 51.0, 42.0, 28.0, 35.0, 23.0, 22.0, 10.0, 11.0, 11.0, 11.0, 11.0, 5.0, 3.0, 6.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09539794921875, -0.0923452377319336, -0.08929252624511719, -0.08623981475830078, -0.08318710327148438, -0.08013439178466797, -0.07708168029785156, -0.07402896881103516, -0.07097625732421875, -0.06792354583740234, -0.06487083435058594, -0.06181812286376953, -0.058765411376953125, -0.05571269989013672, -0.05265998840332031, -0.049607276916503906, -0.0465545654296875, -0.043501853942871094, -0.04044914245605469, -0.03739643096923828, -0.034343719482421875, -0.03129100799560547, -0.028238296508789062, -0.025185585021972656, -0.02213287353515625, -0.019080162048339844, -0.016027450561523438, -0.012974739074707031, -0.009922027587890625, -0.006869316101074219, -0.0038166046142578125, -0.0007638931274414062, 0.002288818359375, 0.005341529846191406, 0.008394241333007812, 0.011446952819824219, 0.014499664306640625, 0.01755237579345703, 0.020605087280273438, 0.023657798767089844, 0.02671051025390625, 0.029763221740722656, 0.03281593322753906, 0.03586864471435547, 0.038921356201171875, 0.04197406768798828, 0.04502677917480469, 0.048079490661621094, 0.0511322021484375, 0.054184913635253906, 0.05723762512207031, 0.06029033660888672, 0.06334304809570312, 0.06639575958251953, 0.06944847106933594, 0.07250118255615234, 0.07555389404296875, 0.07860660552978516, 0.08165931701660156, 0.08471202850341797, 0.08776473999023438, 0.09081745147705078, 0.09387016296386719, 0.0969228744506836, 0.0999755859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 8.0, 4.0, 5.0, 9.0, 12.0, 11.0, 18.0, 33.0, 35.0, 66.0, 97.0, 147.0, 260.0, 443.0, 924.0, 2131.0, 6504.0, 38871.0, 438871.0, 506983.0, 41931.0, 6901.0, 2160.0, 910.0, 488.0, 269.0, 147.0, 89.0, 67.0, 38.0, 25.0, 29.0, 17.0, 12.0, 10.0, 9.0, 9.0, 8.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.375244140625, -0.3648262023925781, -0.35440826416015625, -0.3439903259277344, -0.3335723876953125, -0.3231544494628906, -0.31273651123046875, -0.3023185729980469, -0.291900634765625, -0.2814826965332031, -0.27106475830078125, -0.2606468200683594, -0.2502288818359375, -0.23981094360351562, -0.22939300537109375, -0.21897506713867188, -0.20855712890625, -0.19813919067382812, -0.18772125244140625, -0.17730331420898438, -0.1668853759765625, -0.15646743774414062, -0.14604949951171875, -0.13563156127929688, -0.125213623046875, -0.11479568481445312, -0.10437774658203125, -0.09395980834960938, -0.0835418701171875, -0.07312393188476562, -0.06270599365234375, -0.052288055419921875, -0.0418701171875, -0.031452178955078125, -0.02103424072265625, -0.010616302490234375, -0.0001983642578125, 0.010219573974609375, 0.02063751220703125, 0.031055450439453125, 0.041473388671875, 0.051891326904296875, 0.06230926513671875, 0.07272720336914062, 0.0831451416015625, 0.09356307983398438, 0.10398101806640625, 0.11439895629882812, 0.12481689453125, 0.13523483276367188, 0.14565277099609375, 0.15607070922851562, 0.1664886474609375, 0.17690658569335938, 0.18732452392578125, 0.19774246215820312, 0.208160400390625, 0.21857833862304688, 0.22899627685546875, 0.23941421508789062, 0.2498321533203125, 0.2602500915527344, 0.27066802978515625, 0.2810859680175781, 0.29150390625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 8.0, 3.0, 4.0, 9.0, 7.0, 9.0, 12.0, 10.0, 15.0, 17.0, 21.0, 20.0, 28.0, 27.0, 23.0, 38.0, 47.0, 48.0, 52.0, 36.0, 48.0, 31.0, 55.0, 47.0, 39.0, 36.0, 42.0, 32.0, 28.0, 23.0, 22.0, 32.0, 26.0, 22.0, 16.0, 11.0, 12.0, 11.0, 7.0, 11.0, 5.0, 8.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.3408203125, -0.3315238952636719, -0.32222747802734375, -0.3129310607910156, -0.3036346435546875, -0.2943382263183594, -0.28504180908203125, -0.2757453918457031, -0.266448974609375, -0.2571525573730469, -0.24785614013671875, -0.23855972290039062, -0.2292633056640625, -0.21996688842773438, -0.21067047119140625, -0.20137405395507812, -0.19207763671875, -0.18278121948242188, -0.17348480224609375, -0.16418838500976562, -0.1548919677734375, -0.14559555053710938, -0.13629913330078125, -0.12700271606445312, -0.117706298828125, -0.10840988159179688, -0.09911346435546875, -0.08981704711914062, -0.0805206298828125, -0.07122421264648438, -0.06192779541015625, -0.052631378173828125, -0.0433349609375, -0.034038543701171875, -0.02474212646484375, -0.015445709228515625, -0.0061492919921875, 0.003147125244140625, 0.01244354248046875, 0.021739959716796875, 0.031036376953125, 0.040332794189453125, 0.04962921142578125, 0.058925628662109375, 0.0682220458984375, 0.07751846313476562, 0.08681488037109375, 0.09611129760742188, 0.10540771484375, 0.11470413208007812, 0.12400054931640625, 0.13329696655273438, 0.1425933837890625, 0.15188980102539062, 0.16118621826171875, 0.17048263549804688, 0.179779052734375, 0.18907546997070312, 0.19837188720703125, 0.20766830444335938, 0.2169647216796875, 0.22626113891601562, 0.23555755615234375, 0.24485397338867188, 0.254150390625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 6.0, 6.0, 3.0, 6.0, 7.0, 12.0, 15.0, 23.0, 40.0, 33.0, 44.0, 67.0, 111.0, 212.0, 434.0, 900.0, 2099.0, 6316.0, 32895.0, 740939.0, 241160.0, 16204.0, 4095.0, 1481.0, 601.0, 329.0, 162.0, 113.0, 79.0, 44.0, 32.0, 28.0, 13.0, 16.0, 9.0, 4.0, 7.0, 4.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1602783203125, -0.15507888793945312, -0.14987945556640625, -0.14468002319335938, -0.1394805908203125, -0.13428115844726562, -0.12908172607421875, -0.12388229370117188, -0.118682861328125, -0.11348342895507812, -0.10828399658203125, -0.10308456420898438, -0.0978851318359375, -0.09268569946289062, -0.08748626708984375, -0.08228683471679688, -0.07708740234375, -0.07188796997070312, -0.06668853759765625, -0.061489105224609375, -0.0562896728515625, -0.051090240478515625, -0.04589080810546875, -0.040691375732421875, -0.035491943359375, -0.030292510986328125, -0.02509307861328125, -0.019893646240234375, -0.0146942138671875, -0.009494781494140625, -0.00429534912109375, 0.000904083251953125, 0.006103515625, 0.011302947998046875, 0.01650238037109375, 0.021701812744140625, 0.0269012451171875, 0.032100677490234375, 0.03730010986328125, 0.042499542236328125, 0.047698974609375, 0.052898406982421875, 0.05809783935546875, 0.06329727172851562, 0.0684967041015625, 0.07369613647460938, 0.07889556884765625, 0.08409500122070312, 0.08929443359375, 0.09449386596679688, 0.09969329833984375, 0.10489273071289062, 0.1100921630859375, 0.11529159545898438, 0.12049102783203125, 0.12569046020507812, 0.130889892578125, 0.13608932495117188, 0.14128875732421875, 0.14648818969726562, 0.1516876220703125, 0.15688705444335938, 0.16208648681640625, 0.16728591918945312, 0.1724853515625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 10.0, 6.0, 14.0, 23.0, 59.0, 76.0, 175.0, 203.0, 200.0, 94.0, 61.0, 24.0, 15.0, 15.0, 8.0, 4.0, 3.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.534027099609375e-05, -7.34422355890274e-05, -7.154420018196106e-05, -6.964616477489471e-05, -6.774812936782837e-05, -6.585009396076202e-05, -6.395205855369568e-05, -6.205402314662933e-05, -6.015598773956299e-05, -5.825795233249664e-05, -5.63599169254303e-05, -5.446188151836395e-05, -5.256384611129761e-05, -5.066581070423126e-05, -4.876777529716492e-05, -4.686973989009857e-05, -4.4971704483032227e-05, -4.307366907596588e-05, -4.1175633668899536e-05, -3.927759826183319e-05, -3.7379562854766846e-05, -3.54815274477005e-05, -3.3583492040634155e-05, -3.168545663356781e-05, -2.9787421226501465e-05, -2.788938581943512e-05, -2.5991350412368774e-05, -2.409331500530243e-05, -2.2195279598236084e-05, -2.029724419116974e-05, -1.8399208784103394e-05, -1.650117337703705e-05, -1.4603137969970703e-05, -1.2705102562904358e-05, -1.0807067155838013e-05, -8.909031748771667e-06, -7.010996341705322e-06, -5.112960934638977e-06, -3.214925527572632e-06, -1.3168901205062866e-06, 5.811452865600586e-07, 2.479180693626404e-06, 4.377216100692749e-06, 6.275251507759094e-06, 8.17328691482544e-06, 1.0071322321891785e-05, 1.196935772895813e-05, 1.3867393136024475e-05, 1.576542854309082e-05, 1.7663463950157166e-05, 1.956149935722351e-05, 2.1459534764289856e-05, 2.33575701713562e-05, 2.5255605578422546e-05, 2.715364098548889e-05, 2.9051676392555237e-05, 3.094971179962158e-05, 3.284774720668793e-05, 3.474578261375427e-05, 3.664381802082062e-05, 3.854185342788696e-05, 4.043988883495331e-05, 4.233792424201965e-05, 4.4235959649086e-05, 4.6133995056152344e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 10.0, 24.0, 18.0, 34.0, 68.0, 127.0, 174.0, 430.0, 905.0, 2190.0, 7075.0, 40840.0, 729907.0, 241264.0, 18230.0, 4261.0, 1579.0, 653.0, 321.0, 157.0, 92.0, 54.0, 34.0, 23.0, 11.0, 11.0, 14.0, 8.0, 8.0, 5.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.155517578125, -0.1504688262939453, -0.14542007446289062, -0.14037132263183594, -0.13532257080078125, -0.13027381896972656, -0.12522506713867188, -0.12017631530761719, -0.1151275634765625, -0.11007881164550781, -0.10503005981445312, -0.09998130798339844, -0.09493255615234375, -0.08988380432128906, -0.08483505249023438, -0.07978630065917969, -0.074737548828125, -0.06968879699707031, -0.06464004516601562, -0.05959129333496094, -0.05454254150390625, -0.04949378967285156, -0.044445037841796875, -0.03939628601074219, -0.0343475341796875, -0.029298782348632812, -0.024250030517578125, -0.019201278686523438, -0.01415252685546875, -0.009103775024414062, -0.004055023193359375, 0.0009937286376953125, 0.00604248046875, 0.011091232299804688, 0.016139984130859375, 0.021188735961914062, 0.02623748779296875, 0.03128623962402344, 0.036334991455078125, 0.04138374328613281, 0.0464324951171875, 0.05148124694824219, 0.056529998779296875, 0.06157875061035156, 0.06662750244140625, 0.07167625427246094, 0.07672500610351562, 0.08177375793457031, 0.086822509765625, 0.09187126159667969, 0.09692001342773438, 0.10196876525878906, 0.10701751708984375, 0.11206626892089844, 0.11711502075195312, 0.12216377258300781, 0.1272125244140625, 0.1322612762451172, 0.13731002807617188, 0.14235877990722656, 0.14740753173828125, 0.15245628356933594, 0.15750503540039062, 0.1625537872314453, 0.1676025390625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 9.0, 7.0, 19.0, 43.0, 67.0, 83.0, 148.0, 152.0, 129.0, 105.0, 95.0, 47.0, 25.0, 14.0, 11.0, 7.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.168212890625, -0.16216087341308594, -0.15610885620117188, -0.1500568389892578, -0.14400482177734375, -0.1379528045654297, -0.13190078735351562, -0.12584877014160156, -0.1197967529296875, -0.11374473571777344, -0.10769271850585938, -0.10164070129394531, -0.09558868408203125, -0.08953666687011719, -0.08348464965820312, -0.07743263244628906, -0.071380615234375, -0.06532859802246094, -0.059276580810546875, -0.05322456359863281, -0.04717254638671875, -0.04112052917480469, -0.035068511962890625, -0.029016494750976562, -0.0229644775390625, -0.016912460327148438, -0.010860443115234375, -0.0048084259033203125, 0.00124359130859375, 0.0072956085205078125, 0.013347625732421875, 0.019399642944335938, 0.02545166015625, 0.03150367736816406, 0.037555694580078125, 0.04360771179199219, 0.04965972900390625, 0.05571174621582031, 0.061763763427734375, 0.06781578063964844, 0.0738677978515625, 0.07991981506347656, 0.08597183227539062, 0.09202384948730469, 0.09807586669921875, 0.10412788391113281, 0.11017990112304688, 0.11623191833496094, 0.122283935546875, 0.12833595275878906, 0.13438796997070312, 0.1404399871826172, 0.14649200439453125, 0.1525440216064453, 0.15859603881835938, 0.16464805603027344, 0.1707000732421875, 0.17675209045410156, 0.18280410766601562, 0.1888561248779297, 0.19490814208984375, 0.2009601593017578, 0.20701217651367188, 0.21306419372558594, 0.2191162109375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 6.0, 13.0, 17.0, 35.0, 65.0, 87.0, 136.0, 213.0, 154.0, 111.0, 70.0, 41.0, 17.0, 11.0, 9.0, 6.0, 1.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3956902027130127, -2.324364423751831, -2.2530386447906494, -2.1817128658294678, -2.110386848449707, -2.0390610694885254, -1.9677352905273438, -1.896409511566162, -1.8250837326049805, -1.7537579536437988, -1.6824321746826172, -1.611106276512146, -1.5397804975509644, -1.4684547185897827, -1.3971288204193115, -1.3258030414581299, -1.2544772624969482, -1.1831514835357666, -1.111825704574585, -1.0404998064041138, -0.9691740274429321, -0.8978482484817505, -0.8265224099159241, -0.7551965713500977, -0.683870792388916, -0.6125450134277344, -0.541219174861908, -0.46989336609840393, -0.3985675573348999, -0.3272417485713959, -0.25591593980789185, -0.18459013104438782, -0.11326432228088379, -0.04193851351737976, 0.029387295246124268, 0.1007131040096283, 0.17203891277313232, 0.24336472153663635, 0.3146905303001404, 0.3860163390636444, 0.45734214782714844, 0.5286679267883301, 0.5999937653541565, 0.6713196039199829, 0.7426453828811646, 0.8139711618423462, 0.8852970004081726, 0.956622838973999, 1.0279486179351807, 1.0992743968963623, 1.170600175857544, 1.2419260740280151, 1.3132518529891968, 1.3845776319503784, 1.4559035301208496, 1.5272293090820312, 1.598555088043213, 1.6698808670043945, 1.7412066459655762, 1.8125325441360474, 1.883858323097229, 1.9551841020584106, 2.026510000228882, 2.0978357791900635, 2.169161558151245]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 5.0, 10.0, 11.0, 6.0, 21.0, 25.0, 19.0, 28.0, 25.0, 34.0, 35.0, 54.0, 53.0, 58.0, 69.0, 57.0, 71.0, 59.0, 60.0, 40.0, 41.0, 37.0, 39.0, 33.0, 20.0, 12.0, 17.0, 17.0, 11.0, 11.0, 9.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0], "bins": [-1.751138687133789, -1.7048673629760742, -1.6585959196090698, -1.612324595451355, -1.5660532712936401, -1.5197818279266357, -1.473510503768921, -1.427239179611206, -1.3809678554534912, -1.3346965312957764, -1.288425087928772, -1.2421537637710571, -1.1958824396133423, -1.149610996246338, -1.103339672088623, -1.0570683479309082, -1.0107969045639038, -0.9645255208015442, -0.9182541966438293, -0.8719828128814697, -0.8257114887237549, -0.7794401049613953, -0.7331687211990356, -0.6868973970413208, -0.6406260132789612, -0.5943546295166016, -0.5480833053588867, -0.5018119215965271, -0.45554056763648987, -0.40926921367645264, -0.362997829914093, -0.3167264759540558, -0.27045512199401855, -0.22418376803398132, -0.1779123991727829, -0.13164103031158447, -0.08536967635154724, -0.03909832239151001, 0.007173061370849609, 0.05344441533088684, 0.09971576929092407, 0.1459871232509613, 0.19225849211215973, 0.23852986097335815, 0.2848012149333954, 0.3310725688934326, 0.37734395265579224, 0.42361530661582947, 0.4698866605758667, 0.5161580443382263, 0.5624293684959412, 0.6087007522583008, 0.6549720764160156, 0.7012434601783752, 0.7475148439407349, 0.7937861680984497, 0.8400575518608093, 0.886328935623169, 0.9326002597808838, 0.9788716435432434, 1.025143027305603, 1.0714143514633179, 1.1176857948303223, 1.163957118988037, 1.210228443145752]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 2.0, 3.0, 3.0, 6.0, 12.0, 18.0, 24.0, 28.0, 28.0, 45.0, 66.0, 89.0, 116.0, 167.0, 294.0, 490.0, 1452.0, 8956.0, 3638004.0, 535778.0, 6372.0, 1167.0, 436.0, 216.0, 131.0, 107.0, 65.0, 43.0, 36.0, 24.0, 27.0, 24.0, 15.0, 10.0, 8.0, 2.0, 5.0, 6.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.6884765625, -0.6646575927734375, -0.640838623046875, -0.6170196533203125, -0.59320068359375, -0.5693817138671875, -0.545562744140625, -0.5217437744140625, -0.4979248046875, -0.4741058349609375, -0.450286865234375, -0.4264678955078125, -0.40264892578125, -0.3788299560546875, -0.355010986328125, -0.3311920166015625, -0.307373046875, -0.2835540771484375, -0.259735107421875, -0.2359161376953125, -0.21209716796875, -0.1882781982421875, -0.164459228515625, -0.1406402587890625, -0.1168212890625, -0.0930023193359375, -0.069183349609375, -0.0453643798828125, -0.02154541015625, 0.0022735595703125, 0.026092529296875, 0.0499114990234375, 0.07373046875, 0.0975494384765625, 0.121368408203125, 0.1451873779296875, 0.16900634765625, 0.1928253173828125, 0.216644287109375, 0.2404632568359375, 0.2642822265625, 0.2881011962890625, 0.311920166015625, 0.3357391357421875, 0.35955810546875, 0.3833770751953125, 0.407196044921875, 0.4310150146484375, 0.454833984375, 0.4786529541015625, 0.502471923828125, 0.5262908935546875, 0.55010986328125, 0.5739288330078125, 0.597747802734375, 0.6215667724609375, 0.6453857421875, 0.6692047119140625, 0.693023681640625, 0.7168426513671875, 0.74066162109375, 0.7644805908203125, 0.788299560546875, 0.8121185302734375, 0.8359375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 7.0, 22.0, 24.0, 40.0, 44.0, 83.0, 101.0, 105.0, 104.0, 115.0, 92.0, 83.0, 61.0, 48.0, 25.0, 21.0, 16.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.302734375, -0.2965097427368164, -0.2902851104736328, -0.2840604782104492, -0.2778358459472656, -0.27161121368408203, -0.26538658142089844, -0.25916194915771484, -0.25293731689453125, -0.24671268463134766, -0.24048805236816406, -0.23426342010498047, -0.22803878784179688, -0.22181415557861328, -0.2155895233154297, -0.2093648910522461, -0.2031402587890625, -0.1969156265258789, -0.1906909942626953, -0.18446636199951172, -0.17824172973632812, -0.17201709747314453, -0.16579246520996094, -0.15956783294677734, -0.15334320068359375, -0.14711856842041016, -0.14089393615722656, -0.13466930389404297, -0.12844467163085938, -0.12222003936767578, -0.11599540710449219, -0.1097707748413086, -0.103546142578125, -0.0973215103149414, -0.09109687805175781, -0.08487224578857422, -0.07864761352539062, -0.07242298126220703, -0.06619834899902344, -0.059973716735839844, -0.05374908447265625, -0.047524452209472656, -0.04129981994628906, -0.03507518768310547, -0.028850555419921875, -0.02262592315673828, -0.016401290893554688, -0.010176658630371094, -0.0039520263671875, 0.0022726058959960938, 0.008497238159179688, 0.014721870422363281, 0.020946502685546875, 0.02717113494873047, 0.03339576721191406, 0.039620399475097656, 0.04584503173828125, 0.052069664001464844, 0.05829429626464844, 0.06451892852783203, 0.07074356079101562, 0.07696819305419922, 0.08319282531738281, 0.0894174575805664, 0.09564208984375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 16.0, 8.0, 28.0, 41.0, 58.0, 121.0, 182.0, 342.0, 623.0, 1505.0, 3698.0, 11605.0, 58815.0, 3232920.0, 833589.0, 37021.0, 8646.0, 2810.0, 1092.0, 510.0, 269.0, 141.0, 79.0, 56.0, 37.0, 27.0, 15.0, 10.0, 8.0, 6.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.323974609375, -0.3131294250488281, -0.30228424072265625, -0.2914390563964844, -0.2805938720703125, -0.2697486877441406, -0.25890350341796875, -0.24805831909179688, -0.237213134765625, -0.22636795043945312, -0.21552276611328125, -0.20467758178710938, -0.1938323974609375, -0.18298721313476562, -0.17214202880859375, -0.16129684448242188, -0.15045166015625, -0.13960647583007812, -0.12876129150390625, -0.11791610717773438, -0.1070709228515625, -0.09622573852539062, -0.08538055419921875, -0.07453536987304688, -0.063690185546875, -0.052845001220703125, -0.04199981689453125, -0.031154632568359375, -0.0203094482421875, -0.009464263916015625, 0.00138092041015625, 0.012226104736328125, 0.0230712890625, 0.033916473388671875, 0.04476165771484375, 0.055606842041015625, 0.0664520263671875, 0.07729721069335938, 0.08814239501953125, 0.09898757934570312, 0.109832763671875, 0.12067794799804688, 0.13152313232421875, 0.14236831665039062, 0.1532135009765625, 0.16405868530273438, 0.17490386962890625, 0.18574905395507812, 0.19659423828125, 0.20743942260742188, 0.21828460693359375, 0.22912979125976562, 0.2399749755859375, 0.2508201599121094, 0.26166534423828125, 0.2725105285644531, 0.283355712890625, 0.2942008972167969, 0.30504608154296875, 0.3158912658691406, 0.3267364501953125, 0.3375816345214844, 0.34842681884765625, 0.3592720031738281, 0.3701171875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 6.0, 7.0, 8.0, 11.0, 11.0, 20.0, 26.0, 55.0, 83.0, 200.0, 674.0, 1530.0, 911.0, 248.0, 107.0, 57.0, 42.0, 22.0, 17.0, 10.0, 6.0, 7.0, 11.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.334716796875, -0.3250465393066406, -0.31537628173828125, -0.3057060241699219, -0.2960357666015625, -0.2863655090332031, -0.27669525146484375, -0.2670249938964844, -0.257354736328125, -0.24768447875976562, -0.23801422119140625, -0.22834396362304688, -0.2186737060546875, -0.20900344848632812, -0.19933319091796875, -0.18966293334960938, -0.17999267578125, -0.17032241821289062, -0.16065216064453125, -0.15098190307617188, -0.1413116455078125, -0.13164138793945312, -0.12197113037109375, -0.11230087280273438, -0.102630615234375, -0.09296035766601562, -0.08329010009765625, -0.07361984252929688, -0.0639495849609375, -0.054279327392578125, -0.04460906982421875, -0.034938812255859375, -0.0252685546875, -0.015598297119140625, -0.00592803955078125, 0.003742218017578125, 0.0134124755859375, 0.023082733154296875, 0.03275299072265625, 0.042423248291015625, 0.052093505859375, 0.061763763427734375, 0.07143402099609375, 0.08110427856445312, 0.0907745361328125, 0.10044479370117188, 0.11011505126953125, 0.11978530883789062, 0.12945556640625, 0.13912582397460938, 0.14879608154296875, 0.15846633911132812, 0.1681365966796875, 0.17780685424804688, 0.18747711181640625, 0.19714736938476562, 0.206817626953125, 0.21648788452148438, 0.22615814208984375, 0.23582839965820312, 0.2454986572265625, 0.2551689147949219, 0.26483917236328125, 0.2745094299316406, 0.2841796875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 10.0, 31.0, 80.0, 173.0, 268.0, 250.0, 107.0, 33.0, 24.0, 8.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.657840728759766, -4.562611103057861, -4.467381954193115, -4.372152328491211, -4.276923179626465, -4.1816935539245605, -4.086463928222656, -3.99123477935791, -3.896005153656006, -3.8007757663726807, -3.7055463790893555, -3.610316753387451, -3.515087366104126, -3.419857978820801, -3.3246285915374756, -3.2293992042541504, -3.134169578552246, -3.038940191268921, -2.9437108039855957, -2.8484811782836914, -2.753251791000366, -2.658022403717041, -2.562793016433716, -2.4675636291503906, -2.3723342418670654, -2.2771048545837402, -2.181875467300415, -2.0866458415985107, -1.9914164543151855, -1.8961870670318604, -1.8009576797485352, -1.7057281732559204, -1.6104986667633057, -1.5152692794799805, -1.4200397729873657, -1.3248103857040405, -1.2295808792114258, -1.1343514919281006, -1.0391221046447754, -0.9438925981521606, -0.8486631512641907, -0.7534337043762207, -0.6582042574882507, -0.5629748106002808, -0.4677453935146332, -0.3725159466266632, -0.2772865295410156, -0.18205708265304565, -0.08682763576507568, 0.00840180367231369, 0.10363124310970306, 0.19886067509651184, 0.2940901219844818, 0.3893195688724518, 0.48454898595809937, 0.5797784328460693, 0.6750078797340393, 0.7702373266220093, 0.8654667735099792, 0.9606962203979492, 1.0559256076812744, 1.1511551141738892, 1.2463845014572144, 1.341614007949829, 1.4368433952331543]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 7.0, 5.0, 6.0, 7.0, 16.0, 19.0, 28.0, 28.0, 34.0, 46.0, 56.0, 69.0, 62.0, 58.0, 71.0, 78.0, 67.0, 71.0, 52.0, 53.0, 39.0, 37.0, 24.0, 20.0, 19.0, 7.0, 7.0, 8.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8536587357521057, -0.8142216205596924, -0.774784505367279, -0.7353473901748657, -0.6959102153778076, -0.6564731597900391, -0.617035984992981, -0.5775988698005676, -0.5381617546081543, -0.49872463941574097, -0.45928752422332764, -0.4198503792285919, -0.3804132640361786, -0.34097614884376526, -0.30153900384902954, -0.2621018886566162, -0.22266477346420288, -0.18322765827178955, -0.14379052817821503, -0.1043534055352211, -0.06491628289222717, -0.025479167699813843, 0.013957962393760681, 0.053395092487335205, 0.09283220767974854, 0.13226932287216187, 0.1717064529657364, 0.2111435830593109, 0.25058069825172424, 0.2900178134441376, 0.3294549584388733, 0.3688920736312866, 0.4083291292190552, 0.4477662444114685, 0.48720335960388184, 0.5266404747962952, 0.5660775899887085, 0.6055147647857666, 0.6449518799781799, 0.6843889951705933, 0.7238261103630066, 0.7632632255554199, 0.8027003407478333, 0.8421374559402466, 0.8815746307373047, 0.9210116863250732, 0.9604488611221313, 0.9998859763145447, 1.039323091506958, 1.0787602663040161, 1.1181973218917847, 1.1576344966888428, 1.1970715522766113, 1.2365087270736694, 1.275945782661438, 1.315382957458496, 1.3548200130462646, 1.3942571878433228, 1.4336942434310913, 1.4731314182281494, 1.512568473815918, 1.552005648612976, 1.5914427042007446, 1.6308798789978027, 1.6703170537948608]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 4.0, 2.0, 14.0, 10.0, 17.0, 24.0, 37.0, 56.0, 84.0, 105.0, 180.0, 274.0, 439.0, 733.0, 1234.0, 2305.0, 4298.0, 8807.0, 18647.0, 41486.0, 95343.0, 206474.0, 295136.0, 203043.0, 92970.0, 40223.0, 18171.0, 8634.0, 4319.0, 2306.0, 1211.0, 700.0, 423.0, 273.0, 168.0, 116.0, 76.0, 48.0, 41.0, 36.0, 22.0, 19.0, 10.0, 12.0, 5.0, 5.0, 5.0, 2.0, 4.0, 0.0, 2.0], "bins": [-0.1634521484375, -0.1588459014892578, -0.15423965454101562, -0.14963340759277344, -0.14502716064453125, -0.14042091369628906, -0.13581466674804688, -0.1312084197998047, -0.1266021728515625, -0.12199592590332031, -0.11738967895507812, -0.11278343200683594, -0.10817718505859375, -0.10357093811035156, -0.09896469116210938, -0.09435844421386719, -0.089752197265625, -0.08514595031738281, -0.08053970336914062, -0.07593345642089844, -0.07132720947265625, -0.06672096252441406, -0.062114715576171875, -0.05750846862792969, -0.0529022216796875, -0.04829597473144531, -0.043689727783203125, -0.03908348083496094, -0.03447723388671875, -0.029870986938476562, -0.025264739990234375, -0.020658493041992188, -0.01605224609375, -0.011445999145507812, -0.006839752197265625, -0.0022335052490234375, 0.00237274169921875, 0.0069789886474609375, 0.011585235595703125, 0.016191482543945312, 0.0207977294921875, 0.025403976440429688, 0.030010223388671875, 0.03461647033691406, 0.03922271728515625, 0.04382896423339844, 0.048435211181640625, 0.05304145812988281, 0.057647705078125, 0.06225395202636719, 0.06686019897460938, 0.07146644592285156, 0.07607269287109375, 0.08067893981933594, 0.08528518676757812, 0.08989143371582031, 0.0944976806640625, 0.09910392761230469, 0.10371017456054688, 0.10831642150878906, 0.11292266845703125, 0.11752891540527344, 0.12213516235351562, 0.1267414093017578, 0.13134765625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 6.0, 4.0, 5.0, 6.0, 8.0, 9.0, 9.0, 12.0, 24.0, 27.0, 33.0, 30.0, 48.0, 41.0, 61.0, 49.0, 53.0, 41.0, 63.0, 65.0, 52.0, 54.0, 44.0, 32.0, 44.0, 30.0, 22.0, 25.0, 31.0, 13.0, 18.0, 14.0, 7.0, 7.0, 7.0, 3.0, 7.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11358642578125, -0.11029434204101562, -0.10700225830078125, -0.10371017456054688, -0.1004180908203125, -0.09712600708007812, -0.09383392333984375, -0.09054183959960938, -0.087249755859375, -0.08395767211914062, -0.08066558837890625, -0.07737350463867188, -0.0740814208984375, -0.07078933715820312, -0.06749725341796875, -0.06420516967773438, -0.0609130859375, -0.057621002197265625, -0.05432891845703125, -0.051036834716796875, -0.0477447509765625, -0.044452667236328125, -0.04116058349609375, -0.037868499755859375, -0.034576416015625, -0.031284332275390625, -0.02799224853515625, -0.024700164794921875, -0.0214080810546875, -0.018115997314453125, -0.01482391357421875, -0.011531829833984375, -0.00823974609375, -0.004947662353515625, -0.00165557861328125, 0.001636505126953125, 0.0049285888671875, 0.008220672607421875, 0.01151275634765625, 0.014804840087890625, 0.018096923828125, 0.021389007568359375, 0.02468109130859375, 0.027973175048828125, 0.0312652587890625, 0.034557342529296875, 0.03784942626953125, 0.041141510009765625, 0.04443359375, 0.047725677490234375, 0.05101776123046875, 0.054309844970703125, 0.0576019287109375, 0.060894012451171875, 0.06418609619140625, 0.06747817993164062, 0.070770263671875, 0.07406234741210938, 0.07735443115234375, 0.08064651489257812, 0.0839385986328125, 0.08723068237304688, 0.09052276611328125, 0.09381484985351562, 0.09710693359375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 10.0, 13.0, 10.0, 14.0, 35.0, 36.0, 42.0, 92.0, 198.0, 322.0, 692.0, 1812.0, 7212.0, 55193.0, 650633.0, 300849.0, 24823.0, 4161.0, 1250.0, 520.0, 261.0, 129.0, 92.0, 57.0, 29.0, 26.0, 11.0, 5.0, 4.0, 9.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.35595703125, -0.3436088562011719, -0.33126068115234375, -0.3189125061035156, -0.3065643310546875, -0.2942161560058594, -0.28186798095703125, -0.2695198059082031, -0.257171630859375, -0.24482345581054688, -0.23247528076171875, -0.22012710571289062, -0.2077789306640625, -0.19543075561523438, -0.18308258056640625, -0.17073440551757812, -0.15838623046875, -0.14603805541992188, -0.13368988037109375, -0.12134170532226562, -0.1089935302734375, -0.09664535522460938, -0.08429718017578125, -0.07194900512695312, -0.059600830078125, -0.047252655029296875, -0.03490447998046875, -0.022556304931640625, -0.0102081298828125, 0.002140045166015625, 0.01448822021484375, 0.026836395263671875, 0.0391845703125, 0.051532745361328125, 0.06388092041015625, 0.07622909545898438, 0.0885772705078125, 0.10092544555664062, 0.11327362060546875, 0.12562179565429688, 0.137969970703125, 0.15031814575195312, 0.16266632080078125, 0.17501449584960938, 0.1873626708984375, 0.19971084594726562, 0.21205902099609375, 0.22440719604492188, 0.23675537109375, 0.24910354614257812, 0.26145172119140625, 0.2737998962402344, 0.2861480712890625, 0.2984962463378906, 0.31084442138671875, 0.3231925964355469, 0.335540771484375, 0.3478889465332031, 0.36023712158203125, 0.3725852966308594, 0.3849334716796875, 0.3972816467285156, 0.40962982177734375, 0.4219779968261719, 0.434326171875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 8.0, 7.0, 6.0, 9.0, 13.0, 15.0, 13.0, 23.0, 27.0, 27.0, 27.0, 37.0, 33.0, 45.0, 51.0, 50.0, 49.0, 61.0, 54.0, 49.0, 62.0, 49.0, 48.0, 38.0, 36.0, 25.0, 31.0, 15.0, 13.0, 18.0, 13.0, 4.0, 7.0, 14.0, 6.0, 2.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.28466796875, -0.2737998962402344, -0.26293182373046875, -0.2520637512207031, -0.2411956787109375, -0.23032760620117188, -0.21945953369140625, -0.20859146118164062, -0.197723388671875, -0.18685531616210938, -0.17598724365234375, -0.16511917114257812, -0.1542510986328125, -0.14338302612304688, -0.13251495361328125, -0.12164688110351562, -0.11077880859375, -0.09991073608398438, -0.08904266357421875, -0.07817459106445312, -0.0673065185546875, -0.056438446044921875, -0.04557037353515625, -0.034702301025390625, -0.023834228515625, -0.012966156005859375, -0.00209808349609375, 0.008769989013671875, 0.0196380615234375, 0.030506134033203125, 0.04137420654296875, 0.052242279052734375, 0.0631103515625, 0.07397842407226562, 0.08484649658203125, 0.09571456909179688, 0.1065826416015625, 0.11745071411132812, 0.12831878662109375, 0.13918685913085938, 0.150054931640625, 0.16092300415039062, 0.17179107666015625, 0.18265914916992188, 0.1935272216796875, 0.20439529418945312, 0.21526336669921875, 0.22613143920898438, 0.23699951171875, 0.24786758422851562, 0.25873565673828125, 0.2696037292480469, 0.2804718017578125, 0.2913398742675781, 0.30220794677734375, 0.3130760192871094, 0.323944091796875, 0.3348121643066406, 0.34568023681640625, 0.3565483093261719, 0.3674163818359375, 0.3782844543457031, 0.38915252685546875, 0.4000205993652344, 0.410888671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 4.0, 6.0, 12.0, 13.0, 25.0, 36.0, 47.0, 97.0, 105.0, 182.0, 277.0, 471.0, 962.0, 2214.0, 6106.0, 23374.0, 187523.0, 729243.0, 76713.0, 13594.0, 4066.0, 1641.0, 774.0, 378.0, 222.0, 165.0, 81.0, 63.0, 51.0, 28.0, 22.0, 19.0, 11.0, 4.0, 4.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.2010498046875, -0.1958026885986328, -0.19055557250976562, -0.18530845642089844, -0.18006134033203125, -0.17481422424316406, -0.16956710815429688, -0.1643199920654297, -0.1590728759765625, -0.1538257598876953, -0.14857864379882812, -0.14333152770996094, -0.13808441162109375, -0.13283729553222656, -0.12759017944335938, -0.12234306335449219, -0.117095947265625, -0.11184883117675781, -0.10660171508789062, -0.10135459899902344, -0.09610748291015625, -0.09086036682128906, -0.08561325073242188, -0.08036613464355469, -0.0751190185546875, -0.06987190246582031, -0.06462478637695312, -0.05937767028808594, -0.05413055419921875, -0.04888343811035156, -0.043636322021484375, -0.03838920593261719, -0.03314208984375, -0.027894973754882812, -0.022647857666015625, -0.017400741577148438, -0.01215362548828125, -0.0069065093994140625, -0.001659393310546875, 0.0035877227783203125, 0.0088348388671875, 0.014081954956054688, 0.019329071044921875, 0.024576187133789062, 0.02982330322265625, 0.03507041931152344, 0.040317535400390625, 0.04556465148925781, 0.050811767578125, 0.05605888366699219, 0.061305999755859375, 0.06655311584472656, 0.07180023193359375, 0.07704734802246094, 0.08229446411132812, 0.08754158020019531, 0.0927886962890625, 0.09803581237792969, 0.10328292846679688, 0.10853004455566406, 0.11377716064453125, 0.11902427673339844, 0.12427139282226562, 0.1295185089111328, 0.134765625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 6.0, 5.0, 18.0, 53.0, 246.0, 480.0, 132.0, 32.0, 10.0, 5.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0002593994140625, -0.00025367550551891327, -0.00024795159697532654, -0.0002422276884317398, -0.00023650377988815308, -0.00023077987134456635, -0.00022505596280097961, -0.00021933205425739288, -0.00021360814571380615, -0.00020788423717021942, -0.0002021603286266327, -0.00019643642008304596, -0.00019071251153945923, -0.0001849886029958725, -0.00017926469445228577, -0.00017354078590869904, -0.0001678168773651123, -0.00016209296882152557, -0.00015636906027793884, -0.0001506451517343521, -0.00014492124319076538, -0.00013919733464717865, -0.00013347342610359192, -0.0001277495175600052, -0.00012202560901641846, -0.00011630170047283173, -0.000110577791929245, -0.00010485388338565826, -9.912997484207153e-05, -9.34060662984848e-05, -8.768215775489807e-05, -8.195824921131134e-05, -7.623434066772461e-05, -7.051043212413788e-05, -6.478652358055115e-05, -5.9062615036964417e-05, -5.3338706493377686e-05, -4.7614797949790955e-05, -4.1890889406204224e-05, -3.616698086261749e-05, -3.0443072319030762e-05, -2.471916377544403e-05, -1.89952552318573e-05, -1.3271346688270569e-05, -7.547438144683838e-06, -1.823529601097107e-06, 3.900378942489624e-06, 9.624287486076355e-06, 1.5348196029663086e-05, 2.1072104573249817e-05, 2.6796013116836548e-05, 3.251992166042328e-05, 3.824383020401001e-05, 4.396773874759674e-05, 4.969164729118347e-05, 5.54155558347702e-05, 6.113946437835693e-05, 6.686337292194366e-05, 7.25872814655304e-05, 7.831119000911713e-05, 8.403509855270386e-05, 8.975900709629059e-05, 9.548291563987732e-05, 0.00010120682418346405, 0.00010693073272705078]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 9.0, 12.0, 15.0, 19.0, 22.0, 35.0, 70.0, 115.0, 225.0, 424.0, 993.0, 2647.0, 8784.0, 38235.0, 264457.0, 622620.0, 86497.0, 16139.0, 4303.0, 1618.0, 646.0, 331.0, 134.0, 65.0, 46.0, 28.0, 24.0, 16.0, 9.0, 6.0, 5.0, 6.0, 5.0, 0.0, 1.0, 1.0], "bins": [-0.1986083984375, -0.1940135955810547, -0.18941879272460938, -0.18482398986816406, -0.18022918701171875, -0.17563438415527344, -0.17103958129882812, -0.1664447784423828, -0.1618499755859375, -0.1572551727294922, -0.15266036987304688, -0.14806556701660156, -0.14347076416015625, -0.13887596130371094, -0.13428115844726562, -0.1296863555908203, -0.125091552734375, -0.12049674987792969, -0.11590194702148438, -0.11130714416503906, -0.10671234130859375, -0.10211753845214844, -0.09752273559570312, -0.09292793273925781, -0.0883331298828125, -0.08373832702636719, -0.07914352416992188, -0.07454872131347656, -0.06995391845703125, -0.06535911560058594, -0.060764312744140625, -0.05616950988769531, -0.05157470703125, -0.04697990417480469, -0.042385101318359375, -0.03779029846191406, -0.03319549560546875, -0.028600692749023438, -0.024005889892578125, -0.019411087036132812, -0.0148162841796875, -0.010221481323242188, -0.005626678466796875, -0.0010318756103515625, 0.00356292724609375, 0.008157730102539062, 0.012752532958984375, 0.017347335815429688, 0.021942138671875, 0.026536941528320312, 0.031131744384765625, 0.03572654724121094, 0.04032135009765625, 0.04491615295410156, 0.049510955810546875, 0.05410575866699219, 0.0587005615234375, 0.06329536437988281, 0.06789016723632812, 0.07248497009277344, 0.07707977294921875, 0.08167457580566406, 0.08626937866210938, 0.09086418151855469, 0.095458984375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 2.0, 0.0, 5.0, 5.0, 1.0, 2.0, 7.0, 5.0, 8.0, 11.0, 14.0, 23.0, 18.0, 29.0, 46.0, 45.0, 57.0, 72.0, 84.0, 72.0, 79.0, 70.0, 60.0, 55.0, 46.0, 36.0, 32.0, 28.0, 18.0, 11.0, 16.0, 13.0, 13.0, 11.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1173095703125, -0.11365413665771484, -0.10999870300292969, -0.10634326934814453, -0.10268783569335938, -0.09903240203857422, -0.09537696838378906, -0.0917215347290039, -0.08806610107421875, -0.0844106674194336, -0.08075523376464844, -0.07709980010986328, -0.07344436645507812, -0.06978893280029297, -0.06613349914550781, -0.062478065490722656, -0.0588226318359375, -0.055167198181152344, -0.05151176452636719, -0.04785633087158203, -0.044200897216796875, -0.04054546356201172, -0.03689002990722656, -0.033234596252441406, -0.02957916259765625, -0.025923728942871094, -0.022268295288085938, -0.01861286163330078, -0.014957427978515625, -0.011301994323730469, -0.0076465606689453125, -0.003991127014160156, -0.000335693359375, 0.0033197402954101562, 0.0069751739501953125, 0.010630607604980469, 0.014286041259765625, 0.01794147491455078, 0.021596908569335938, 0.025252342224121094, 0.02890777587890625, 0.032563209533691406, 0.03621864318847656, 0.03987407684326172, 0.043529510498046875, 0.04718494415283203, 0.05084037780761719, 0.054495811462402344, 0.0581512451171875, 0.061806678771972656, 0.06546211242675781, 0.06911754608154297, 0.07277297973632812, 0.07642841339111328, 0.08008384704589844, 0.0837392807006836, 0.08739471435546875, 0.0910501480102539, 0.09470558166503906, 0.09836101531982422, 0.10201644897460938, 0.10567188262939453, 0.10932731628417969, 0.11298274993896484, 0.11663818359375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 20.0, 35.0, 106.0, 190.0, 302.0, 185.0, 93.0, 37.0, 13.0, 6.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.5318427085876465, -4.419381618499756, -4.306920528411865, -4.194458961486816, -4.081997871398926, -3.969536781311035, -3.8570756912231445, -3.744614362716675, -3.632153272628784, -3.5196921825408936, -3.407230854034424, -3.294769763946533, -3.1823084354400635, -3.069847345352173, -2.957386016845703, -2.8449249267578125, -2.732463836669922, -2.6200027465820312, -2.5075414180755615, -2.395080327987671, -2.282618999481201, -2.1701579093933105, -2.05769681930542, -1.9452354907989502, -1.8327741622924805, -1.7203129529953003, -1.6078517436981201, -1.4953906536102295, -1.3829294443130493, -1.2704682350158691, -1.158007025718689, -1.0455458164215088, -0.9330847263336182, -0.820623517036438, -0.7081623673439026, -0.5957011580467224, -0.4832399785518646, -0.37077879905700684, -0.25831758975982666, -0.14585644006729126, -0.033395230770111084, 0.0790659561753273, 0.19152714312076569, 0.30398833751678467, 0.41644951701164246, 0.5289106965065002, 0.6413719058036804, 0.7538330554962158, 0.866294264793396, 0.9787554740905762, 1.0912166833877563, 1.2036778926849365, 1.3161389827728271, 1.4286001920700073, 1.5410614013671875, 1.6535224914550781, 1.7659838199615479, 1.878445029258728, 1.9909062385559082, 2.103367328643799, 2.2158286571502686, 2.328289747238159, 2.440751075744629, 2.5532121658325195, 2.66567325592041]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 5.0, 5.0, 16.0, 13.0, 12.0, 21.0, 22.0, 28.0, 25.0, 33.0, 36.0, 43.0, 39.0, 46.0, 58.0, 66.0, 66.0, 50.0, 56.0, 37.0, 38.0, 36.0, 42.0, 24.0, 31.0, 28.0, 27.0, 18.0, 14.0, 9.0, 5.0, 6.0, 9.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.468476414680481, -1.4217227697372437, -1.3749690055847168, -1.3282153606414795, -1.2814617156982422, -1.2347080707550049, -1.1879544258117676, -1.1412006616592407, -1.0944470167160034, -1.0476933717727661, -1.0009396076202393, -0.954185962677002, -0.9074323177337646, -0.8606786727905273, -0.8139249682426453, -0.7671712636947632, -0.7204176187515259, -0.6736639738082886, -0.6269102692604065, -0.5801565647125244, -0.5334029197692871, -0.4866492450237274, -0.4398955702781677, -0.39314189553260803, -0.34638822078704834, -0.29963454604148865, -0.25288087129592896, -0.20612719655036926, -0.15937352180480957, -0.11261984705924988, -0.06586617231369019, -0.019112497568130493, 0.02764129638671875, 0.07439497113227844, 0.12114864587783813, 0.16790232062339783, 0.21465599536895752, 0.2614096701145172, 0.3081633448600769, 0.3549170196056366, 0.4016706943511963, 0.448424369096756, 0.4951780438423157, 0.5419317483901978, 0.5886853933334351, 0.6354390382766724, 0.6821927428245544, 0.7289464473724365, 0.7757000923156738, 0.8224537372589111, 0.8692074418067932, 0.9159611463546753, 0.9627147912979126, 1.00946843624115, 1.0562222003936768, 1.102975845336914, 1.1497294902801514, 1.1964831352233887, 1.243236780166626, 1.2899905443191528, 1.3367441892623901, 1.3834978342056274, 1.4302515983581543, 1.4770052433013916, 1.523758888244629]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 5.0, 9.0, 5.0, 8.0, 10.0, 8.0, 13.0, 18.0, 30.0, 38.0, 34.0, 48.0, 60.0, 77.0, 111.0, 157.0, 245.0, 401.0, 683.0, 1176.0, 2483.0, 5559.0, 15267.0, 59527.0, 530856.0, 3092879.0, 406218.0, 51839.0, 15490.0, 5673.0, 2467.0, 1188.0, 658.0, 384.0, 224.0, 122.0, 111.0, 60.0, 41.0, 33.0, 20.0, 11.0, 12.0, 5.0, 10.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2218017578125, -0.21571731567382812, -0.20963287353515625, -0.20354843139648438, -0.1974639892578125, -0.19137954711914062, -0.18529510498046875, -0.17921066284179688, -0.173126220703125, -0.16704177856445312, -0.16095733642578125, -0.15487289428710938, -0.1487884521484375, -0.14270401000976562, -0.13661956787109375, -0.13053512573242188, -0.12445068359375, -0.11836624145507812, -0.11228179931640625, -0.10619735717773438, -0.1001129150390625, -0.09402847290039062, -0.08794403076171875, -0.08185958862304688, -0.075775146484375, -0.06969070434570312, -0.06360626220703125, -0.057521820068359375, -0.0514373779296875, -0.045352935791015625, -0.03926849365234375, -0.033184051513671875, -0.027099609375, -0.021015167236328125, -0.01493072509765625, -0.008846282958984375, -0.0027618408203125, 0.003322601318359375, 0.00940704345703125, 0.015491485595703125, 0.021575927734375, 0.027660369873046875, 0.03374481201171875, 0.039829254150390625, 0.0459136962890625, 0.051998138427734375, 0.05808258056640625, 0.06416702270507812, 0.07025146484375, 0.07633590698242188, 0.08242034912109375, 0.08850479125976562, 0.0945892333984375, 0.10067367553710938, 0.10675811767578125, 0.11284255981445312, 0.118927001953125, 0.12501144409179688, 0.13109588623046875, 0.13718032836914062, 0.1432647705078125, 0.14934921264648438, 0.15543365478515625, 0.16151809692382812, 0.1676025390625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 9.0, 12.0, 5.0, 17.0, 17.0, 30.0, 25.0, 23.0, 40.0, 37.0, 56.0, 67.0, 61.0, 42.0, 54.0, 66.0, 54.0, 60.0, 56.0, 46.0, 42.0, 31.0, 36.0, 30.0, 20.0, 25.0, 7.0, 6.0, 7.0, 8.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1170654296875, -0.11359500885009766, -0.11012458801269531, -0.10665416717529297, -0.10318374633789062, -0.09971332550048828, -0.09624290466308594, -0.0927724838256836, -0.08930206298828125, -0.0858316421508789, -0.08236122131347656, -0.07889080047607422, -0.07542037963867188, -0.07194995880126953, -0.06847953796386719, -0.06500911712646484, -0.0615386962890625, -0.058068275451660156, -0.05459785461425781, -0.05112743377685547, -0.047657012939453125, -0.04418659210205078, -0.04071617126464844, -0.037245750427246094, -0.03377532958984375, -0.030304908752441406, -0.026834487915039062, -0.02336406707763672, -0.019893646240234375, -0.01642322540283203, -0.012952804565429688, -0.009482383728027344, -0.006011962890625, -0.0025415420532226562, 0.0009288787841796875, 0.004399299621582031, 0.007869720458984375, 0.011340141296386719, 0.014810562133789062, 0.018280982971191406, 0.02175140380859375, 0.025221824645996094, 0.028692245483398438, 0.03216266632080078, 0.035633087158203125, 0.03910350799560547, 0.04257392883300781, 0.046044349670410156, 0.0495147705078125, 0.052985191345214844, 0.05645561218261719, 0.05992603302001953, 0.06339645385742188, 0.06686687469482422, 0.07033729553222656, 0.0738077163696289, 0.07727813720703125, 0.0807485580444336, 0.08421897888183594, 0.08768939971923828, 0.09115982055664062, 0.09463024139404297, 0.09810066223144531, 0.10157108306884766, 0.10504150390625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 14.0, 14.0, 30.0, 38.0, 80.0, 135.0, 219.0, 436.0, 957.0, 2151.0, 6114.0, 25718.0, 276656.0, 3741231.0, 117072.0, 15994.0, 4397.0, 1579.0, 688.0, 337.0, 178.0, 98.0, 65.0, 25.0, 17.0, 19.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.443359375, -0.4308204650878906, -0.41828155517578125, -0.4057426452636719, -0.3932037353515625, -0.3806648254394531, -0.36812591552734375, -0.3555870056152344, -0.343048095703125, -0.3305091857910156, -0.31797027587890625, -0.3054313659667969, -0.2928924560546875, -0.2803535461425781, -0.26781463623046875, -0.2552757263183594, -0.24273681640625, -0.23019790649414062, -0.21765899658203125, -0.20512008666992188, -0.1925811767578125, -0.18004226684570312, -0.16750335693359375, -0.15496444702148438, -0.142425537109375, -0.12988662719726562, -0.11734771728515625, -0.10480880737304688, -0.0922698974609375, -0.07973098754882812, -0.06719207763671875, -0.054653167724609375, -0.0421142578125, -0.029575347900390625, -0.01703643798828125, -0.004497528076171875, 0.0080413818359375, 0.020580291748046875, 0.03311920166015625, 0.045658111572265625, 0.058197021484375, 0.07073593139648438, 0.08327484130859375, 0.09581375122070312, 0.1083526611328125, 0.12089157104492188, 0.13343048095703125, 0.14596939086914062, 0.15850830078125, 0.17104721069335938, 0.18358612060546875, 0.19612503051757812, 0.2086639404296875, 0.22120285034179688, 0.23374176025390625, 0.24628067016601562, 0.258819580078125, 0.2713584899902344, 0.28389739990234375, 0.2964363098144531, 0.3089752197265625, 0.3215141296386719, 0.33405303955078125, 0.3465919494628906, 0.359130859375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 7.0, 2.0, 5.0, 5.0, 9.0, 4.0, 11.0, 14.0, 16.0, 27.0, 25.0, 35.0, 58.0, 93.0, 151.0, 302.0, 627.0, 901.0, 793.0, 420.0, 199.0, 115.0, 59.0, 45.0, 48.0, 29.0, 16.0, 11.0, 15.0, 13.0, 3.0, 3.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25, -0.24157333374023438, -0.23314666748046875, -0.22472000122070312, -0.2162933349609375, -0.20786666870117188, -0.19944000244140625, -0.19101333618164062, -0.182586669921875, -0.17416000366210938, -0.16573333740234375, -0.15730667114257812, -0.1488800048828125, -0.14045333862304688, -0.13202667236328125, -0.12360000610351562, -0.11517333984375, -0.10674667358398438, -0.09832000732421875, -0.08989334106445312, -0.0814666748046875, -0.07304000854492188, -0.06461334228515625, -0.056186676025390625, -0.047760009765625, -0.039333343505859375, -0.03090667724609375, -0.022480010986328125, -0.0140533447265625, -0.005626678466796875, 0.00279998779296875, 0.011226654052734375, 0.0196533203125, 0.028079986572265625, 0.03650665283203125, 0.044933319091796875, 0.0533599853515625, 0.061786651611328125, 0.07021331787109375, 0.07863998413085938, 0.087066650390625, 0.09549331665039062, 0.10391998291015625, 0.11234664916992188, 0.1207733154296875, 0.12919998168945312, 0.13762664794921875, 0.14605331420898438, 0.15447998046875, 0.16290664672851562, 0.17133331298828125, 0.17975997924804688, 0.1881866455078125, 0.19661331176757812, 0.20503997802734375, 0.21346664428710938, 0.221893310546875, 0.23031997680664062, 0.23874664306640625, 0.24717330932617188, 0.2555999755859375, 0.2640266418457031, 0.27245330810546875, 0.2808799743652344, 0.289306640625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 4.0, 5.0, 7.0, 6.0, 6.0, 10.0, 22.0, 28.0, 46.0, 68.0, 137.0, 140.0, 157.0, 127.0, 99.0, 55.0, 33.0, 21.0, 14.0, 10.0, 6.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.527974843978882, -3.44838285446167, -3.368790864944458, -3.289198875427246, -3.209606885910034, -3.1300148963928223, -3.0504229068756104, -2.9708309173583984, -2.8912391662597656, -2.8116471767425537, -2.732055187225342, -2.65246319770813, -2.572871208190918, -2.493279218673706, -2.413687229156494, -2.3340954780578613, -2.2545032501220703, -2.1749112606048584, -2.0953192710876465, -2.0157272815704346, -1.9361352920532227, -1.8565433025360107, -1.7769514322280884, -1.6973594427108765, -1.6177674531936646, -1.5381754636764526, -1.4585834741592407, -1.3789914846420288, -1.2993996143341064, -1.2198076248168945, -1.1402156352996826, -1.0606236457824707, -0.9810316562652588, -0.9014396667480469, -0.821847677230835, -0.7422557473182678, -0.6626637578010559, -0.583071768283844, -0.5034798383712769, -0.42388784885406494, -0.344295859336853, -0.2647038698196411, -0.1851119101047516, -0.10551993548870087, -0.025927960872650146, 0.05366402864456177, 0.1332559883594513, 0.21284794807434082, 0.29243993759155273, 0.37203192710876465, 0.4516238868236542, 0.5312158465385437, 0.6108078360557556, 0.6903998255729675, 0.7699917554855347, 0.8495837450027466, 0.9291757345199585, 1.0087677240371704, 1.0883597135543823, 1.1679517030715942, 1.2475435733795166, 1.3271355628967285, 1.4067275524139404, 1.4863195419311523, 1.5659115314483643]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 3.0, 10.0, 3.0, 13.0, 15.0, 15.0, 19.0, 12.0, 25.0, 31.0, 29.0, 44.0, 43.0, 46.0, 53.0, 50.0, 59.0, 52.0, 49.0, 58.0, 49.0, 44.0, 61.0, 33.0, 28.0, 26.0, 26.0, 26.0, 19.0, 14.0, 7.0, 6.0, 4.0, 9.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.3624032735824585, -1.3234059810638428, -1.2844088077545166, -1.2454115152359009, -1.2064142227172852, -1.1674169301986694, -1.1284196376800537, -1.0894224643707275, -1.0504251718521118, -1.011427879333496, -0.9724306464195251, -0.9334334135055542, -0.8944361209869385, -0.8554388284683228, -0.8164415955543518, -0.7774443626403809, -0.7384470701217651, -0.6994497776031494, -0.6604525446891785, -0.6214553117752075, -0.5824580192565918, -0.5434607267379761, -0.5044634938240051, -0.4654662311077118, -0.42646896839141846, -0.3874717056751251, -0.3484744429588318, -0.30947718024253845, -0.2704799175262451, -0.23148265480995178, -0.19248539209365845, -0.1534881293773651, -0.11449074745178223, -0.07549348473548889, -0.03649622201919556, 0.0025010406970977783, 0.04149830341339111, 0.08049556612968445, 0.11949282884597778, 0.15849009156227112, 0.19748735427856445, 0.2364846169948578, 0.2754818797111511, 0.31447914242744446, 0.3534764051437378, 0.39247366786003113, 0.43147093057632446, 0.4704681932926178, 0.5094654560089111, 0.5484627485275269, 0.5874599814414978, 0.6264572143554688, 0.6654545068740845, 0.7044517993927002, 0.7434490323066711, 0.7824462652206421, 0.8214435577392578, 0.8604408502578735, 0.8994380831718445, 0.9384353160858154, 0.9774326086044312, 1.0164299011230469, 1.055427074432373, 1.0944243669509888, 1.1334216594696045]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 6.0, 2.0, 5.0, 9.0, 7.0, 15.0, 11.0, 20.0, 19.0, 37.0, 38.0, 71.0, 89.0, 117.0, 194.0, 286.0, 661.0, 1254.0, 2643.0, 6164.0, 16477.0, 47911.0, 145542.0, 338936.0, 305795.0, 119291.0, 39117.0, 13553.0, 5293.0, 2327.0, 1156.0, 579.0, 334.0, 204.0, 114.0, 84.0, 54.0, 42.0, 31.0, 23.0, 11.0, 10.0, 4.0, 3.0, 4.0, 3.0, 5.0, 4.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.18408203125, -0.17748641967773438, -0.17089080810546875, -0.16429519653320312, -0.1576995849609375, -0.15110397338867188, -0.14450836181640625, -0.13791275024414062, -0.131317138671875, -0.12472152709960938, -0.11812591552734375, -0.11153030395507812, -0.1049346923828125, -0.09833908081054688, -0.09174346923828125, -0.08514785766601562, -0.07855224609375, -0.07195663452148438, -0.06536102294921875, -0.058765411376953125, -0.0521697998046875, -0.045574188232421875, -0.03897857666015625, -0.032382965087890625, -0.025787353515625, -0.019191741943359375, -0.01259613037109375, -0.006000518798828125, 0.0005950927734375, 0.007190704345703125, 0.01378631591796875, 0.020381927490234375, 0.0269775390625, 0.033573150634765625, 0.04016876220703125, 0.046764373779296875, 0.0533599853515625, 0.059955596923828125, 0.06655120849609375, 0.07314682006835938, 0.079742431640625, 0.08633804321289062, 0.09293365478515625, 0.09952926635742188, 0.1061248779296875, 0.11272048950195312, 0.11931610107421875, 0.12591171264648438, 0.13250732421875, 0.13910293579101562, 0.14569854736328125, 0.15229415893554688, 0.1588897705078125, 0.16548538208007812, 0.17208099365234375, 0.17867660522460938, 0.185272216796875, 0.19186782836914062, 0.19846343994140625, 0.20505905151367188, 0.2116546630859375, 0.21825027465820312, 0.22484588623046875, 0.23144149780273438, 0.238037109375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 5.0, 9.0, 15.0, 7.0, 13.0, 19.0, 27.0, 23.0, 42.0, 49.0, 42.0, 64.0, 54.0, 59.0, 54.0, 56.0, 71.0, 64.0, 58.0, 39.0, 55.0, 38.0, 35.0, 28.0, 18.0, 16.0, 8.0, 7.0, 3.0, 11.0, 5.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.127685546875, -0.12393951416015625, -0.1201934814453125, -0.11644744873046875, -0.112701416015625, -0.10895538330078125, -0.1052093505859375, -0.10146331787109375, -0.09771728515625, -0.09397125244140625, -0.0902252197265625, -0.08647918701171875, -0.082733154296875, -0.07898712158203125, -0.0752410888671875, -0.07149505615234375, -0.0677490234375, -0.06400299072265625, -0.0602569580078125, -0.05651092529296875, -0.052764892578125, -0.04901885986328125, -0.0452728271484375, -0.04152679443359375, -0.03778076171875, -0.03403472900390625, -0.0302886962890625, -0.02654266357421875, -0.022796630859375, -0.01905059814453125, -0.0153045654296875, -0.01155853271484375, -0.0078125, -0.00406646728515625, -0.0003204345703125, 0.00342559814453125, 0.007171630859375, 0.01091766357421875, 0.0146636962890625, 0.01840972900390625, 0.02215576171875, 0.02590179443359375, 0.0296478271484375, 0.03339385986328125, 0.037139892578125, 0.04088592529296875, 0.0446319580078125, 0.04837799072265625, 0.0521240234375, 0.05587005615234375, 0.0596160888671875, 0.06336212158203125, 0.067108154296875, 0.07085418701171875, 0.0746002197265625, 0.07834625244140625, 0.08209228515625, 0.08583831787109375, 0.0895843505859375, 0.09333038330078125, 0.097076416015625, 0.10082244873046875, 0.1045684814453125, 0.10831451416015625, 0.112060546875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 7.0, 14.0, 13.0, 23.0, 22.0, 22.0, 59.0, 50.0, 100.0, 149.0, 190.0, 314.0, 453.0, 756.0, 1381.0, 2976.0, 8108.0, 32968.0, 206680.0, 643968.0, 117916.0, 21102.0, 5970.0, 2226.0, 1151.0, 686.0, 386.0, 266.0, 183.0, 119.0, 91.0, 55.0, 44.0, 33.0, 14.0, 17.0, 10.0, 8.0, 8.0, 2.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.319580078125, -0.30938720703125, -0.2991943359375, -0.28900146484375, -0.27880859375, -0.26861572265625, -0.2584228515625, -0.24822998046875, -0.238037109375, -0.22784423828125, -0.2176513671875, -0.20745849609375, -0.197265625, -0.18707275390625, -0.1768798828125, -0.16668701171875, -0.156494140625, -0.14630126953125, -0.1361083984375, -0.12591552734375, -0.11572265625, -0.10552978515625, -0.0953369140625, -0.08514404296875, -0.074951171875, -0.06475830078125, -0.0545654296875, -0.04437255859375, -0.0341796875, -0.02398681640625, -0.0137939453125, -0.00360107421875, 0.006591796875, 0.01678466796875, 0.0269775390625, 0.03717041015625, 0.04736328125, 0.05755615234375, 0.0677490234375, 0.07794189453125, 0.088134765625, 0.09832763671875, 0.1085205078125, 0.11871337890625, 0.12890625, 0.13909912109375, 0.1492919921875, 0.15948486328125, 0.169677734375, 0.17987060546875, 0.1900634765625, 0.20025634765625, 0.21044921875, 0.22064208984375, 0.2308349609375, 0.24102783203125, 0.251220703125, 0.26141357421875, 0.2716064453125, 0.28179931640625, 0.2919921875, 0.30218505859375, 0.3123779296875, 0.32257080078125, 0.332763671875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 2.0, 5.0, 12.0, 12.0, 11.0, 14.0, 11.0, 27.0, 32.0, 38.0, 39.0, 35.0, 58.0, 52.0, 48.0, 53.0, 46.0, 57.0, 46.0, 57.0, 57.0, 49.0, 44.0, 37.0, 30.0, 21.0, 19.0, 18.0, 15.0, 8.0, 7.0, 9.0, 7.0, 4.0, 8.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.435546875, -0.4223594665527344, -0.40917205810546875, -0.3959846496582031, -0.3827972412109375, -0.3696098327636719, -0.35642242431640625, -0.3432350158691406, -0.330047607421875, -0.3168601989746094, -0.30367279052734375, -0.2904853820800781, -0.2772979736328125, -0.2641105651855469, -0.25092315673828125, -0.23773574829101562, -0.22454833984375, -0.21136093139648438, -0.19817352294921875, -0.18498611450195312, -0.1717987060546875, -0.15861129760742188, -0.14542388916015625, -0.13223648071289062, -0.119049072265625, -0.10586166381835938, -0.09267425537109375, -0.07948684692382812, -0.0662994384765625, -0.053112030029296875, -0.03992462158203125, -0.026737213134765625, -0.0135498046875, -0.000362396240234375, 0.01282501220703125, 0.026012420654296875, 0.0391998291015625, 0.052387237548828125, 0.06557464599609375, 0.07876205444335938, 0.091949462890625, 0.10513687133789062, 0.11832427978515625, 0.13151168823242188, 0.1446990966796875, 0.15788650512695312, 0.17107391357421875, 0.18426132202148438, 0.19744873046875, 0.21063613891601562, 0.22382354736328125, 0.23701095581054688, 0.2501983642578125, 0.2633857727050781, 0.27657318115234375, 0.2897605895996094, 0.302947998046875, 0.3161354064941406, 0.32932281494140625, 0.3425102233886719, 0.3556976318359375, 0.3688850402832031, 0.38207244873046875, 0.3952598571777344, 0.408447265625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 10.0, 14.0, 16.0, 23.0, 42.0, 54.0, 83.0, 137.0, 231.0, 392.0, 600.0, 1049.0, 1901.0, 3854.0, 12028.0, 222011.0, 779607.0, 16822.0, 4702.0, 2073.0, 1157.0, 632.0, 387.0, 262.0, 140.0, 104.0, 67.0, 46.0, 25.0, 19.0, 20.0, 13.0, 7.0, 2.0, 7.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.410400390625, -0.3972053527832031, -0.38401031494140625, -0.3708152770996094, -0.3576202392578125, -0.3444252014160156, -0.33123016357421875, -0.3180351257324219, -0.304840087890625, -0.2916450500488281, -0.27845001220703125, -0.2652549743652344, -0.2520599365234375, -0.23886489868164062, -0.22566986083984375, -0.21247482299804688, -0.19927978515625, -0.18608474731445312, -0.17288970947265625, -0.15969467163085938, -0.1464996337890625, -0.13330459594726562, -0.12010955810546875, -0.10691452026367188, -0.093719482421875, -0.08052444458007812, -0.06732940673828125, -0.054134368896484375, -0.0409393310546875, -0.027744293212890625, -0.01454925537109375, -0.001354217529296875, 0.0118408203125, 0.025035858154296875, 0.03823089599609375, 0.051425933837890625, 0.0646209716796875, 0.07781600952148438, 0.09101104736328125, 0.10420608520507812, 0.117401123046875, 0.13059616088867188, 0.14379119873046875, 0.15698623657226562, 0.1701812744140625, 0.18337631225585938, 0.19657135009765625, 0.20976638793945312, 0.22296142578125, 0.23615646362304688, 0.24935150146484375, 0.2625465393066406, 0.2757415771484375, 0.2889366149902344, 0.30213165283203125, 0.3153266906738281, 0.328521728515625, 0.3417167663574219, 0.35491180419921875, 0.3681068420410156, 0.3813018798828125, 0.3944969177246094, 0.40769195556640625, 0.4208869934082031, 0.43408203125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 12.0, 14.0, 27.0, 37.0, 128.0, 334.0, 268.0, 70.0, 23.0, 22.0, 15.0, 4.0, 11.0, 5.0, 7.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001819133758544922, -0.00017722230404615402, -0.00017253123223781586, -0.0001678401604294777, -0.00016314908862113953, -0.00015845801681280136, -0.0001537669450044632, -0.00014907587319612503, -0.00014438480138778687, -0.0001396937295794487, -0.00013500265777111053, -0.00013031158596277237, -0.0001256205141544342, -0.00012092944234609604, -0.00011623837053775787, -0.00011154729872941971, -0.00010685622692108154, -0.00010216515511274338, -9.747408330440521e-05, -9.278301149606705e-05, -8.809193968772888e-05, -8.340086787939072e-05, -7.870979607105255e-05, -7.401872426271439e-05, -6.932765245437622e-05, -6.463658064603806e-05, -5.994550883769989e-05, -5.5254437029361725e-05, -5.056336522102356e-05, -4.5872293412685394e-05, -4.118122160434723e-05, -3.6490149796009064e-05, -3.17990779876709e-05, -2.7108006179332733e-05, -2.2416934370994568e-05, -1.7725862562656403e-05, -1.3034790754318237e-05, -8.343718945980072e-06, -3.6526471376419067e-06, 1.0384246706962585e-06, 5.729496479034424e-06, 1.0420568287372589e-05, 1.5111640095710754e-05, 1.980271190404892e-05, 2.4493783712387085e-05, 2.918485552072525e-05, 3.3875927329063416e-05, 3.856699913740158e-05, 4.3258070945739746e-05, 4.794914275407791e-05, 5.264021456241608e-05, 5.733128637075424e-05, 6.202235817909241e-05, 6.671342998743057e-05, 7.140450179576874e-05, 7.60955736041069e-05, 8.078664541244507e-05, 8.547771722078323e-05, 9.01687890291214e-05, 9.485986083745956e-05, 9.955093264579773e-05, 0.0001042420044541359, 0.00010893307626247406, 0.00011362414807081223, 0.00011831521987915039]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 4.0, 2.0, 6.0, 9.0, 7.0, 6.0, 15.0, 26.0, 28.0, 47.0, 66.0, 104.0, 131.0, 252.0, 443.0, 720.0, 1223.0, 2810.0, 8655.0, 97809.0, 902776.0, 24260.0, 4856.0, 1931.0, 962.0, 531.0, 316.0, 166.0, 118.0, 75.0, 60.0, 36.0, 25.0, 18.0, 12.0, 12.0, 9.0, 10.0, 4.0, 9.0, 4.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4169921875, -0.4036598205566406, -0.39032745361328125, -0.3769950866699219, -0.3636627197265625, -0.3503303527832031, -0.33699798583984375, -0.3236656188964844, -0.310333251953125, -0.2970008850097656, -0.28366851806640625, -0.2703361511230469, -0.2570037841796875, -0.24367141723632812, -0.23033905029296875, -0.21700668334960938, -0.20367431640625, -0.19034194946289062, -0.17700958251953125, -0.16367721557617188, -0.1503448486328125, -0.13701248168945312, -0.12368011474609375, -0.11034774780273438, -0.097015380859375, -0.08368301391601562, -0.07035064697265625, -0.057018280029296875, -0.0436859130859375, -0.030353546142578125, -0.01702117919921875, -0.003688812255859375, 0.0096435546875, 0.022975921630859375, 0.03630828857421875, 0.049640655517578125, 0.0629730224609375, 0.07630538940429688, 0.08963775634765625, 0.10297012329101562, 0.116302490234375, 0.12963485717773438, 0.14296722412109375, 0.15629959106445312, 0.1696319580078125, 0.18296432495117188, 0.19629669189453125, 0.20962905883789062, 0.22296142578125, 0.23629379272460938, 0.24962615966796875, 0.2629585266113281, 0.2762908935546875, 0.2896232604980469, 0.30295562744140625, 0.3162879943847656, 0.329620361328125, 0.3429527282714844, 0.35628509521484375, 0.3696174621582031, 0.3829498291015625, 0.3962821960449219, 0.40961456298828125, 0.4229469299316406, 0.436279296875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 6.0, 2.0, 3.0, 4.0, 3.0, 6.0, 14.0, 22.0, 54.0, 156.0, 234.0, 255.0, 141.0, 51.0, 26.0, 8.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.387939453125, -0.3750419616699219, -0.36214447021484375, -0.3492469787597656, -0.3363494873046875, -0.3234519958496094, -0.31055450439453125, -0.2976570129394531, -0.284759521484375, -0.2718620300292969, -0.25896453857421875, -0.24606704711914062, -0.2331695556640625, -0.22027206420898438, -0.20737457275390625, -0.19447708129882812, -0.18157958984375, -0.16868209838867188, -0.15578460693359375, -0.14288711547851562, -0.1299896240234375, -0.11709213256835938, -0.10419464111328125, -0.09129714965820312, -0.078399658203125, -0.06550216674804688, -0.05260467529296875, -0.039707183837890625, -0.0268096923828125, -0.013912200927734375, -0.00101470947265625, 0.011882781982421875, 0.0247802734375, 0.037677764892578125, 0.05057525634765625, 0.06347274780273438, 0.0763702392578125, 0.08926773071289062, 0.10216522216796875, 0.11506271362304688, 0.127960205078125, 0.14085769653320312, 0.15375518798828125, 0.16665267944335938, 0.1795501708984375, 0.19244766235351562, 0.20534515380859375, 0.21824264526367188, 0.23114013671875, 0.24403762817382812, 0.25693511962890625, 0.2698326110839844, 0.2827301025390625, 0.2956275939941406, 0.30852508544921875, 0.3214225769042969, 0.334320068359375, 0.3472175598144531, 0.36011505126953125, 0.3730125427246094, 0.3859100341796875, 0.3988075256347656, 0.41170501708984375, 0.4246025085449219, 0.4375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 20.0, 78.0, 231.0, 411.0, 171.0, 50.0, 24.0, 9.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.280939102172852, -9.990006446838379, -9.699074745178223, -9.40814208984375, -9.117210388183594, -8.826277732849121, -8.535346031188965, -8.244413375854492, -7.953481197357178, -7.662549018859863, -7.371616840362549, -7.080684661865234, -6.789752006530762, -6.4988203048706055, -6.207887649536133, -5.916955471038818, -5.626023292541504, -5.3350911140441895, -5.044158935546875, -4.7532267570495605, -4.462294578552246, -4.171361923217773, -3.880429744720459, -3.5894975662231445, -3.29856538772583, -3.0076332092285156, -2.716701030731201, -2.4257686138153076, -2.134836435317993, -1.8439042568206787, -1.5529719591140747, -1.2620396614074707, -0.9711084365844727, -0.6801761984825134, -0.3892439603805542, -0.09831172227859497, 0.19262051582336426, 0.4835526943206787, 0.7744849920272827, 1.0654172897338867, 1.3563494682312012, 1.6472816467285156, 1.9382139444351196, 2.2291462421417236, 2.520078420639038, 2.8110105991363525, 3.101943016052246, 3.3928751945495605, 3.683807373046875, 3.9747395515441895, 4.265671730041504, 4.556603908538818, 4.847536087036133, 5.1384687423706055, 5.42940092086792, 5.720333099365234, 6.011265277862549, 6.302197456359863, 6.593129634857178, 6.884061813354492, 7.174994468688965, 7.465926170349121, 7.756858825683594, 8.04779052734375, 8.338723182678223]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 7.0, 6.0, 3.0, 7.0, 7.0, 12.0, 16.0, 17.0, 15.0, 24.0, 25.0, 18.0, 26.0, 13.0, 36.0, 41.0, 38.0, 43.0, 42.0, 67.0, 60.0, 59.0, 51.0, 34.0, 35.0, 28.0, 36.0, 33.0, 31.0, 25.0, 20.0, 20.0, 11.0, 19.0, 11.0, 7.0, 8.0, 11.0, 6.0, 5.0, 3.0, 6.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5542694330215454, -1.503637433052063, -1.4530055522918701, -1.4023735523223877, -1.3517415523529053, -1.3011095523834229, -1.2504775524139404, -1.1998456716537476, -1.1492136716842651, -1.0985816717147827, -1.0479497909545898, -0.9973177909851074, -0.946685791015625, -0.8960537910461426, -0.8454218506813049, -0.7947899103164673, -0.7441579103469849, -0.6935259103775024, -0.6428939700126648, -0.5922620296478271, -0.5416300296783447, -0.4909980595111847, -0.44036608934402466, -0.3897341191768646, -0.3391021490097046, -0.28847017884254456, -0.23783820867538452, -0.1872062385082245, -0.13657426834106445, -0.08594229817390442, -0.035310328006744385, 0.01532164216041565, 0.06595349311828613, 0.11658546328544617, 0.1672174334526062, 0.21784940361976624, 0.26848137378692627, 0.3191133439540863, 0.36974531412124634, 0.42037728428840637, 0.4710092544555664, 0.5216412544250488, 0.5722731947898865, 0.6229051351547241, 0.6735371351242065, 0.724169135093689, 0.7748010754585266, 0.8254330158233643, 0.8760650157928467, 0.9266970157623291, 0.9773289561271667, 1.0279608964920044, 1.0785928964614868, 1.1292248964309692, 1.179856777191162, 1.2304887771606445, 1.281120777130127, 1.3317527770996094, 1.3823847770690918, 1.4330166578292847, 1.483648657798767, 1.5342806577682495, 1.5849125385284424, 1.6355445384979248, 1.6861765384674072]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 11.0, 7.0, 14.0, 23.0, 24.0, 36.0, 41.0, 60.0, 105.0, 158.0, 235.0, 409.0, 838.0, 1761.0, 4675.0, 16707.0, 159459.0, 3571064.0, 399961.0, 27656.0, 6441.0, 2356.0, 1070.0, 484.0, 276.0, 145.0, 94.0, 50.0, 46.0, 24.0, 15.0, 11.0, 9.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.41162109375, -0.4006805419921875, -0.389739990234375, -0.3787994384765625, -0.36785888671875, -0.3569183349609375, -0.345977783203125, -0.3350372314453125, -0.3240966796875, -0.3131561279296875, -0.302215576171875, -0.2912750244140625, -0.28033447265625, -0.2693939208984375, -0.258453369140625, -0.2475128173828125, -0.236572265625, -0.2256317138671875, -0.214691162109375, -0.2037506103515625, -0.19281005859375, -0.1818695068359375, -0.170928955078125, -0.1599884033203125, -0.1490478515625, -0.1381072998046875, -0.127166748046875, -0.1162261962890625, -0.10528564453125, -0.0943450927734375, -0.083404541015625, -0.0724639892578125, -0.0615234375, -0.0505828857421875, -0.039642333984375, -0.0287017822265625, -0.01776123046875, -0.0068206787109375, 0.004119873046875, 0.0150604248046875, 0.0260009765625, 0.0369415283203125, 0.047882080078125, 0.0588226318359375, 0.06976318359375, 0.0807037353515625, 0.091644287109375, 0.1025848388671875, 0.113525390625, 0.1244659423828125, 0.135406494140625, 0.1463470458984375, 0.15728759765625, 0.1682281494140625, 0.179168701171875, 0.1901092529296875, 0.2010498046875, 0.2119903564453125, 0.222930908203125, 0.2338714599609375, 0.24481201171875, 0.2557525634765625, 0.266693115234375, 0.2776336669921875, 0.28857421875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 5.0, 11.0, 13.0, 17.0, 16.0, 27.0, 30.0, 42.0, 56.0, 49.0, 60.0, 61.0, 66.0, 55.0, 80.0, 57.0, 66.0, 52.0, 46.0, 45.0, 41.0, 26.0, 23.0, 17.0, 13.0, 9.0, 7.0, 9.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1497802734375, -0.14558982849121094, -0.14139938354492188, -0.1372089385986328, -0.13301849365234375, -0.1288280487060547, -0.12463760375976562, -0.12044715881347656, -0.1162567138671875, -0.11206626892089844, -0.10787582397460938, -0.10368537902832031, -0.09949493408203125, -0.09530448913574219, -0.09111404418945312, -0.08692359924316406, -0.082733154296875, -0.07854270935058594, -0.07435226440429688, -0.07016181945800781, -0.06597137451171875, -0.06178092956542969, -0.057590484619140625, -0.05340003967285156, -0.0492095947265625, -0.04501914978027344, -0.040828704833984375, -0.03663825988769531, -0.03244781494140625, -0.028257369995117188, -0.024066925048828125, -0.019876480102539062, -0.01568603515625, -0.011495590209960938, -0.007305145263671875, -0.0031147003173828125, 0.00107574462890625, 0.0052661895751953125, 0.009456634521484375, 0.013647079467773438, 0.0178375244140625, 0.022027969360351562, 0.026218414306640625, 0.030408859252929688, 0.03459930419921875, 0.03878974914550781, 0.042980194091796875, 0.04717063903808594, 0.051361083984375, 0.05555152893066406, 0.059741973876953125, 0.06393241882324219, 0.06812286376953125, 0.07231330871582031, 0.07650375366210938, 0.08069419860839844, 0.0848846435546875, 0.08907508850097656, 0.09326553344726562, 0.09745597839355469, 0.10164642333984375, 0.10583686828613281, 0.11002731323242188, 0.11421775817871094, 0.118408203125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 7.0, 5.0, 10.0, 18.0, 17.0, 26.0, 28.0, 48.0, 76.0, 110.0, 163.0, 306.0, 581.0, 1865.0, 8984.0, 110836.0, 3955544.0, 104474.0, 8481.0, 1636.0, 505.0, 245.0, 113.0, 72.0, 42.0, 38.0, 18.0, 11.0, 9.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.904296875, -0.8825035095214844, -0.8607101440429688, -0.8389167785644531, -0.8171234130859375, -0.7953300476074219, -0.7735366821289062, -0.7517433166503906, -0.729949951171875, -0.7081565856933594, -0.6863632202148438, -0.6645698547363281, -0.6427764892578125, -0.6209831237792969, -0.5991897583007812, -0.5773963928222656, -0.55560302734375, -0.5338096618652344, -0.5120162963867188, -0.4902229309082031, -0.4684295654296875, -0.4466361999511719, -0.42484283447265625, -0.4030494689941406, -0.381256103515625, -0.3594627380371094, -0.33766937255859375, -0.3158760070800781, -0.2940826416015625, -0.2722892761230469, -0.25049591064453125, -0.22870254516601562, -0.2069091796875, -0.18511581420898438, -0.16332244873046875, -0.14152908325195312, -0.1197357177734375, -0.09794235229492188, -0.07614898681640625, -0.054355621337890625, -0.032562255859375, -0.010768890380859375, 0.01102447509765625, 0.032817840576171875, 0.0546112060546875, 0.07640457153320312, 0.09819793701171875, 0.11999130249023438, 0.14178466796875, 0.16357803344726562, 0.18537139892578125, 0.20716476440429688, 0.2289581298828125, 0.2507514953613281, 0.27254486083984375, 0.2943382263183594, 0.316131591796875, 0.3379249572753906, 0.35971832275390625, 0.3815116882324219, 0.4033050537109375, 0.4250984191894531, 0.44689178466796875, 0.4686851501464844, 0.490478515625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 2.0, 9.0, 15.0, 19.0, 13.0, 22.0, 49.0, 59.0, 120.0, 205.0, 510.0, 1050.0, 1087.0, 455.0, 190.0, 100.0, 62.0, 26.0, 27.0, 21.0, 14.0, 6.0, 6.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56787109375, -0.5540008544921875, -0.540130615234375, -0.5262603759765625, -0.51239013671875, -0.4985198974609375, -0.484649658203125, -0.4707794189453125, -0.4569091796875, -0.4430389404296875, -0.429168701171875, -0.4152984619140625, -0.40142822265625, -0.3875579833984375, -0.373687744140625, -0.3598175048828125, -0.345947265625, -0.3320770263671875, -0.318206787109375, -0.3043365478515625, -0.29046630859375, -0.2765960693359375, -0.262725830078125, -0.2488555908203125, -0.2349853515625, -0.2211151123046875, -0.207244873046875, -0.1933746337890625, -0.17950439453125, -0.1656341552734375, -0.151763916015625, -0.1378936767578125, -0.1240234375, -0.1101531982421875, -0.096282958984375, -0.0824127197265625, -0.06854248046875, -0.0546722412109375, -0.040802001953125, -0.0269317626953125, -0.0130615234375, 0.0008087158203125, 0.014678955078125, 0.0285491943359375, 0.04241943359375, 0.0562896728515625, 0.070159912109375, 0.0840301513671875, 0.097900390625, 0.1117706298828125, 0.125640869140625, 0.1395111083984375, 0.15338134765625, 0.1672515869140625, 0.181121826171875, 0.1949920654296875, 0.2088623046875, 0.2227325439453125, 0.236602783203125, 0.2504730224609375, 0.26434326171875, 0.2782135009765625, 0.292083740234375, 0.3059539794921875, 0.31982421875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 9.0, 18.0, 20.0, 54.0, 111.0, 199.0, 248.0, 179.0, 86.0, 31.0, 13.0, 14.0, 6.0, 5.0, 2.0, 0.0, 0.0, 3.0], "bins": [-9.009161949157715, -8.837362289428711, -8.665562629699707, -8.493762969970703, -8.3219633102417, -8.150163650512695, -7.978363990783691, -7.8065643310546875, -7.634764671325684, -7.46296501159668, -7.291165351867676, -7.119365692138672, -6.947566032409668, -6.775766372680664, -6.60396671295166, -6.432167053222656, -6.260367393493652, -6.088567733764648, -5.9167680740356445, -5.744968414306641, -5.573168754577637, -5.401369094848633, -5.229569435119629, -5.057769775390625, -4.885969638824463, -4.714169979095459, -4.542370319366455, -4.370570659637451, -4.198770999908447, -4.026971340179443, -3.8551716804504395, -3.6833720207214355, -3.5115723609924316, -3.3397727012634277, -3.167973041534424, -2.99617338180542, -2.824373722076416, -2.652574062347412, -2.480774402618408, -2.3089747428894043, -2.1371750831604004, -1.9653754234313965, -1.7935757637023926, -1.6217761039733887, -1.4499764442443848, -1.2781767845153809, -1.1063770055770874, -0.9345773458480835, -0.76277756690979, -0.5909779071807861, -0.41917821764945984, -0.24737852811813354, -0.07557886838912964, 0.09622079133987427, 0.26802051067352295, 0.43982017040252686, 0.6116198301315308, 0.7834194898605347, 0.9552191495895386, 1.127018928527832, 1.298818588256836, 1.4706182479858398, 1.6424179077148438, 1.8142175674438477, 1.9860172271728516]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 7.0, 12.0, 11.0, 22.0, 21.0, 29.0, 30.0, 45.0, 46.0, 49.0, 64.0, 69.0, 53.0, 56.0, 55.0, 74.0, 45.0, 51.0, 58.0, 43.0, 41.0, 27.0, 23.0, 21.0, 11.0, 10.0, 4.0, 7.0, 4.0, 1.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.224336624145508, -2.1615514755249023, -2.098766326904297, -2.0359809398651123, -1.9731957912445068, -1.9104106426239014, -1.847625494003296, -1.7848403453826904, -1.7220550775527954, -1.65926992893219, -1.596484661102295, -1.5336995124816895, -1.470914363861084, -1.408129096031189, -1.3453439474105835, -1.2825586795806885, -1.219773530960083, -1.1569883823394775, -1.0942031145095825, -1.031417965888977, -0.9686327576637268, -0.9058475494384766, -0.8430624008178711, -0.7802771925926208, -0.7174919843673706, -0.6547067761421204, -0.5919215679168701, -0.5291364192962646, -0.4663512110710144, -0.40356600284576416, -0.3407808244228363, -0.27799564599990845, -0.21521055698394775, -0.1524253636598587, -0.08964017033576965, -0.026854977011680603, 0.03593021631240845, 0.09871542453765869, 0.16150060296058655, 0.2242857813835144, 0.28707098960876465, 0.3498561978340149, 0.41264137625694275, 0.4754265546798706, 0.5382117629051208, 0.6009969711303711, 0.6637821197509766, 0.7265673279762268, 0.789352536201477, 0.8521377444267273, 0.9149229526519775, 0.977708101272583, 1.0404932498931885, 1.1032785177230835, 1.166063666343689, 1.228848934173584, 1.2916340827941895, 1.354419231414795, 1.41720449924469, 1.4799896478652954, 1.5427749156951904, 1.605560064315796, 1.6683452129364014, 1.7311303615570068, 1.7939156293869019]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 1.0, 4.0, 3.0, 8.0, 18.0, 13.0, 26.0, 31.0, 39.0, 55.0, 88.0, 159.0, 262.0, 487.0, 837.0, 1697.0, 3058.0, 6612.0, 14572.0, 35942.0, 95755.0, 260614.0, 359649.0, 165569.0, 59844.0, 23441.0, 9984.0, 4590.0, 2340.0, 1261.0, 664.0, 364.0, 208.0, 121.0, 84.0, 51.0, 39.0, 19.0, 18.0, 13.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.285888671875, -0.27800559997558594, -0.2701225280761719, -0.2622394561767578, -0.25435638427734375, -0.2464733123779297, -0.23859024047851562, -0.23070716857910156, -0.2228240966796875, -0.21494102478027344, -0.20705795288085938, -0.1991748809814453, -0.19129180908203125, -0.1834087371826172, -0.17552566528320312, -0.16764259338378906, -0.159759521484375, -0.15187644958496094, -0.14399337768554688, -0.1361103057861328, -0.12822723388671875, -0.12034416198730469, -0.11246109008789062, -0.10457801818847656, -0.0966949462890625, -0.08881187438964844, -0.08092880249023438, -0.07304573059082031, -0.06516265869140625, -0.05727958679199219, -0.049396514892578125, -0.04151344299316406, -0.03363037109375, -0.025747299194335938, -0.017864227294921875, -0.009981155395507812, -0.00209808349609375, 0.0057849884033203125, 0.013668060302734375, 0.021551132202148438, 0.0294342041015625, 0.03731727600097656, 0.045200347900390625, 0.05308341979980469, 0.06096649169921875, 0.06884956359863281, 0.07673263549804688, 0.08461570739746094, 0.092498779296875, 0.10038185119628906, 0.10826492309570312, 0.11614799499511719, 0.12403106689453125, 0.1319141387939453, 0.13979721069335938, 0.14768028259277344, 0.1555633544921875, 0.16344642639160156, 0.17132949829101562, 0.1792125701904297, 0.18709564208984375, 0.1949787139892578, 0.20286178588867188, 0.21074485778808594, 0.2186279296875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 3.0, 13.0, 14.0, 14.0, 25.0, 29.0, 30.0, 42.0, 51.0, 45.0, 52.0, 53.0, 51.0, 54.0, 56.0, 56.0, 59.0, 59.0, 54.0, 43.0, 34.0, 38.0, 30.0, 20.0, 17.0, 19.0, 15.0, 3.0, 10.0, 4.0, 3.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1602783203125, -0.15598392486572266, -0.1516895294189453, -0.14739513397216797, -0.14310073852539062, -0.13880634307861328, -0.13451194763183594, -0.1302175521850586, -0.12592315673828125, -0.1216287612915039, -0.11733436584472656, -0.11303997039794922, -0.10874557495117188, -0.10445117950439453, -0.10015678405761719, -0.09586238861083984, -0.0915679931640625, -0.08727359771728516, -0.08297920227050781, -0.07868480682373047, -0.07439041137695312, -0.07009601593017578, -0.06580162048339844, -0.061507225036621094, -0.05721282958984375, -0.052918434143066406, -0.04862403869628906, -0.04432964324951172, -0.040035247802734375, -0.03574085235595703, -0.03144645690917969, -0.027152061462402344, -0.022857666015625, -0.018563270568847656, -0.014268875122070312, -0.009974479675292969, -0.005680084228515625, -0.0013856887817382812, 0.0029087066650390625, 0.007203102111816406, 0.01149749755859375, 0.015791893005371094, 0.020086288452148438, 0.02438068389892578, 0.028675079345703125, 0.03296947479248047, 0.03726387023925781, 0.041558265686035156, 0.0458526611328125, 0.050147056579589844, 0.05444145202636719, 0.05873584747314453, 0.06303024291992188, 0.06732463836669922, 0.07161903381347656, 0.0759134292602539, 0.08020782470703125, 0.0845022201538086, 0.08879661560058594, 0.09309101104736328, 0.09738540649414062, 0.10167980194091797, 0.10597419738769531, 0.11026859283447266, 0.11456298828125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 9.0, 2.0, 1.0, 12.0, 7.0, 17.0, 24.0, 21.0, 30.0, 51.0, 60.0, 77.0, 95.0, 131.0, 199.0, 284.0, 393.0, 580.0, 868.0, 1401.0, 2717.0, 5681.0, 13954.0, 44123.0, 185740.0, 603733.0, 132411.0, 33388.0, 11421.0, 4764.0, 2371.0, 1321.0, 814.0, 542.0, 369.0, 252.0, 184.0, 140.0, 91.0, 69.0, 45.0, 51.0, 21.0, 27.0, 15.0, 16.0, 9.0, 12.0, 6.0, 5.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.37109375, -0.3596382141113281, -0.34818267822265625, -0.3367271423339844, -0.3252716064453125, -0.3138160705566406, -0.30236053466796875, -0.2909049987792969, -0.279449462890625, -0.2679939270019531, -0.25653839111328125, -0.24508285522460938, -0.2336273193359375, -0.22217178344726562, -0.21071624755859375, -0.19926071166992188, -0.18780517578125, -0.17634963989257812, -0.16489410400390625, -0.15343856811523438, -0.1419830322265625, -0.13052749633789062, -0.11907196044921875, -0.10761642456054688, -0.096160888671875, -0.08470535278320312, -0.07324981689453125, -0.061794281005859375, -0.0503387451171875, -0.038883209228515625, -0.02742767333984375, -0.015972137451171875, -0.0045166015625, 0.006938934326171875, 0.01839447021484375, 0.029850006103515625, 0.0413055419921875, 0.052761077880859375, 0.06421661376953125, 0.07567214965820312, 0.087127685546875, 0.09858322143554688, 0.11003875732421875, 0.12149429321289062, 0.1329498291015625, 0.14440536499023438, 0.15586090087890625, 0.16731643676757812, 0.17877197265625, 0.19022750854492188, 0.20168304443359375, 0.21313858032226562, 0.2245941162109375, 0.23604965209960938, 0.24750518798828125, 0.2589607238769531, 0.270416259765625, 0.2818717956542969, 0.29332733154296875, 0.3047828674316406, 0.3162384033203125, 0.3276939392089844, 0.33914947509765625, 0.3506050109863281, 0.362060546875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 3.0, 8.0, 4.0, 11.0, 9.0, 11.0, 15.0, 12.0, 21.0, 22.0, 26.0, 27.0, 19.0, 21.0, 37.0, 38.0, 52.0, 40.0, 62.0, 43.0, 55.0, 60.0, 46.0, 51.0, 37.0, 37.0, 44.0, 29.0, 17.0, 25.0, 16.0, 14.0, 21.0, 16.0, 8.0, 8.0, 7.0, 4.0, 6.0, 5.0, 8.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48046875, -0.4659690856933594, -0.45146942138671875, -0.4369697570800781, -0.4224700927734375, -0.4079704284667969, -0.39347076416015625, -0.3789710998535156, -0.364471435546875, -0.3499717712402344, -0.33547210693359375, -0.3209724426269531, -0.3064727783203125, -0.2919731140136719, -0.27747344970703125, -0.2629737854003906, -0.24847412109375, -0.23397445678710938, -0.21947479248046875, -0.20497512817382812, -0.1904754638671875, -0.17597579956054688, -0.16147613525390625, -0.14697647094726562, -0.132476806640625, -0.11797714233398438, -0.10347747802734375, -0.08897781372070312, -0.0744781494140625, -0.059978485107421875, -0.04547882080078125, -0.030979156494140625, -0.0164794921875, -0.001979827880859375, 0.01251983642578125, 0.027019500732421875, 0.0415191650390625, 0.056018829345703125, 0.07051849365234375, 0.08501815795898438, 0.099517822265625, 0.11401748657226562, 0.12851715087890625, 0.14301681518554688, 0.1575164794921875, 0.17201614379882812, 0.18651580810546875, 0.20101547241210938, 0.21551513671875, 0.23001480102539062, 0.24451446533203125, 0.2590141296386719, 0.2735137939453125, 0.2880134582519531, 0.30251312255859375, 0.3170127868652344, 0.331512451171875, 0.3460121154785156, 0.36051177978515625, 0.3750114440917969, 0.3895111083984375, 0.4040107727050781, 0.41851043701171875, 0.4330101013183594, 0.447509765625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 7.0, 9.0, 7.0, 30.0, 18.0, 25.0, 55.0, 63.0, 72.0, 133.0, 235.0, 380.0, 704.0, 1296.0, 2860.0, 6628.0, 18847.0, 108301.0, 809561.0, 72868.0, 15474.0, 5715.0, 2453.0, 1258.0, 608.0, 381.0, 190.0, 123.0, 86.0, 51.0, 27.0, 25.0, 23.0, 12.0, 6.0, 7.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.2822265625, -0.2726325988769531, -0.26303863525390625, -0.2534446716308594, -0.2438507080078125, -0.23425674438476562, -0.22466278076171875, -0.21506881713867188, -0.205474853515625, -0.19588088989257812, -0.18628692626953125, -0.17669296264648438, -0.1670989990234375, -0.15750503540039062, -0.14791107177734375, -0.13831710815429688, -0.12872314453125, -0.11912918090820312, -0.10953521728515625, -0.09994125366210938, -0.0903472900390625, -0.08075332641601562, -0.07115936279296875, -0.061565399169921875, -0.051971435546875, -0.042377471923828125, -0.03278350830078125, -0.023189544677734375, -0.0135955810546875, -0.004001617431640625, 0.00559234619140625, 0.015186309814453125, 0.0247802734375, 0.034374237060546875, 0.04396820068359375, 0.053562164306640625, 0.0631561279296875, 0.07275009155273438, 0.08234405517578125, 0.09193801879882812, 0.101531982421875, 0.11112594604492188, 0.12071990966796875, 0.13031387329101562, 0.1399078369140625, 0.14950180053710938, 0.15909576416015625, 0.16868972778320312, 0.17828369140625, 0.18787765502929688, 0.19747161865234375, 0.20706558227539062, 0.2166595458984375, 0.22625350952148438, 0.23584747314453125, 0.24544143676757812, 0.255035400390625, 0.2646293640136719, 0.27422332763671875, 0.2838172912597656, 0.2934112548828125, 0.3030052185058594, 0.31259918212890625, 0.3221931457519531, 0.331787109375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 9.0, 7.0, 5.0, 16.0, 19.0, 35.0, 39.0, 106.0, 254.0, 270.0, 103.0, 36.0, 34.0, 17.0, 15.0, 7.0, 6.0, 7.0, 4.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00019872188568115234, -0.00019375327974557877, -0.0001887846738100052, -0.0001838160678744316, -0.00017884746193885803, -0.00017387885600328445, -0.00016891025006771088, -0.0001639416441321373, -0.00015897303819656372, -0.00015400443226099014, -0.00014903582632541656, -0.000144067220389843, -0.0001390986144542694, -0.00013413000851869583, -0.00012916140258312225, -0.00012419279664754868, -0.0001192241907119751, -0.00011425558477640152, -0.00010928697884082794, -0.00010431837290525436, -9.934976696968079e-05, -9.438116103410721e-05, -8.941255509853363e-05, -8.444394916296005e-05, -7.947534322738647e-05, -7.45067372918129e-05, -6.953813135623932e-05, -6.456952542066574e-05, -5.960091948509216e-05, -5.4632313549518585e-05, -4.966370761394501e-05, -4.469510167837143e-05, -3.972649574279785e-05, -3.4757889807224274e-05, -2.9789283871650696e-05, -2.4820677936077118e-05, -1.985207200050354e-05, -1.4883466064929962e-05, -9.914860129356384e-06, -4.946254193782806e-06, 2.2351741790771484e-08, 4.990957677364349e-06, 9.959563612937927e-06, 1.4928169548511505e-05, 1.9896775484085083e-05, 2.486538141965866e-05, 2.983398735523224e-05, 3.480259329080582e-05, 3.9771199226379395e-05, 4.473980516195297e-05, 4.970841109752655e-05, 5.467701703310013e-05, 5.9645622968673706e-05, 6.461422890424728e-05, 6.958283483982086e-05, 7.455144077539444e-05, 7.952004671096802e-05, 8.44886526465416e-05, 8.945725858211517e-05, 9.442586451768875e-05, 9.939447045326233e-05, 0.00010436307638883591, 0.00010933168232440948, 0.00011430028825998306, 0.00011926889419555664]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 5.0, 12.0, 14.0, 31.0, 42.0, 39.0, 52.0, 87.0, 144.0, 215.0, 352.0, 596.0, 1192.0, 2481.0, 5864.0, 18197.0, 107214.0, 788014.0, 96042.0, 17247.0, 5676.0, 2315.0, 1139.0, 607.0, 342.0, 203.0, 117.0, 92.0, 61.0, 34.0, 29.0, 22.0, 19.0, 13.0, 9.0, 7.0, 8.0, 1.0, 5.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.228271484375, -0.2196502685546875, -0.211029052734375, -0.2024078369140625, -0.19378662109375, -0.1851654052734375, -0.176544189453125, -0.1679229736328125, -0.1593017578125, -0.1506805419921875, -0.142059326171875, -0.1334381103515625, -0.12481689453125, -0.1161956787109375, -0.107574462890625, -0.0989532470703125, -0.09033203125, -0.0817108154296875, -0.073089599609375, -0.0644683837890625, -0.05584716796875, -0.0472259521484375, -0.038604736328125, -0.0299835205078125, -0.0213623046875, -0.0127410888671875, -0.004119873046875, 0.0045013427734375, 0.01312255859375, 0.0217437744140625, 0.030364990234375, 0.0389862060546875, 0.047607421875, 0.0562286376953125, 0.064849853515625, 0.0734710693359375, 0.08209228515625, 0.0907135009765625, 0.099334716796875, 0.1079559326171875, 0.1165771484375, 0.1251983642578125, 0.133819580078125, 0.1424407958984375, 0.15106201171875, 0.1596832275390625, 0.168304443359375, 0.1769256591796875, 0.185546875, 0.1941680908203125, 0.202789306640625, 0.2114105224609375, 0.22003173828125, 0.2286529541015625, 0.237274169921875, 0.2458953857421875, 0.2545166015625, 0.2631378173828125, 0.271759033203125, 0.2803802490234375, 0.28900146484375, 0.2976226806640625, 0.306243896484375, 0.3148651123046875, 0.323486328125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 6.0, 4.0, 8.0, 22.0, 19.0, 40.0, 59.0, 85.0, 111.0, 141.0, 123.0, 114.0, 82.0, 51.0, 35.0, 30.0, 18.0, 11.0, 10.0, 4.0, 2.0, 1.0, 3.0, 6.0, 1.0, 5.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.263916015625, -0.2545127868652344, -0.24510955810546875, -0.23570632934570312, -0.2263031005859375, -0.21689987182617188, -0.20749664306640625, -0.19809341430664062, -0.188690185546875, -0.17928695678710938, -0.16988372802734375, -0.16048049926757812, -0.1510772705078125, -0.14167404174804688, -0.13227081298828125, -0.12286758422851562, -0.11346435546875, -0.10406112670898438, -0.09465789794921875, -0.08525466918945312, -0.0758514404296875, -0.06644821166992188, -0.05704498291015625, -0.047641754150390625, -0.038238525390625, -0.028835296630859375, -0.01943206787109375, -0.010028839111328125, -0.0006256103515625, 0.008777618408203125, 0.01818084716796875, 0.027584075927734375, 0.0369873046875, 0.046390533447265625, 0.05579376220703125, 0.06519699096679688, 0.0746002197265625, 0.08400344848632812, 0.09340667724609375, 0.10280990600585938, 0.112213134765625, 0.12161636352539062, 0.13101959228515625, 0.14042282104492188, 0.1498260498046875, 0.15922927856445312, 0.16863250732421875, 0.17803573608398438, 0.18743896484375, 0.19684219360351562, 0.20624542236328125, 0.21564865112304688, 0.2250518798828125, 0.23445510864257812, 0.24385833740234375, 0.2532615661621094, 0.262664794921875, 0.2720680236816406, 0.28147125244140625, 0.2908744812011719, 0.3002777099609375, 0.3096809387207031, 0.31908416748046875, 0.3284873962402344, 0.337890625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 17.0, 35.0, 74.0, 225.0, 274.0, 163.0, 83.0, 49.0, 29.0, 17.0, 10.0, 6.0, 1.0, 2.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-6.4491143226623535, -6.2541303634643555, -6.059146404266357, -5.864162445068359, -5.669178009033203, -5.474194049835205, -5.279210090637207, -5.084226131439209, -4.889242172241211, -4.694258213043213, -4.499274253845215, -4.304290294647217, -4.109306335449219, -3.9143221378326416, -3.7193379402160645, -3.5243539810180664, -3.3293700218200684, -3.1343860626220703, -2.9394021034240723, -2.744417905807495, -2.549433946609497, -2.354449987411499, -2.159465789794922, -1.9644818305969238, -1.7694978713989258, -1.5745139122009277, -1.3795298337936401, -1.1845457553863525, -0.9895617961883545, -0.7945777773857117, -0.5995937585830688, -0.40460968017578125, -0.209625244140625, -0.014641225337982178, 0.18034279346466064, 0.37532681226730347, 0.5703108310699463, 0.7652948498725891, 0.9602788686752319, 1.1552629470825195, 1.3502469062805176, 1.5452308654785156, 1.7402149438858032, 1.9351990222930908, 2.130182981491089, 2.325166940689087, 2.520151138305664, 2.715135097503662, 2.91011905670166, 3.105103015899658, 3.3000869750976562, 3.4950711727142334, 3.6900551319122314, 3.8850390911102295, 4.080023288726807, 4.275007247924805, 4.469991207122803, 4.664975166320801, 4.859959125518799, 5.054943084716797, 5.249927520751953, 5.444911479949951, 5.639895439147949, 5.834879398345947, 6.029863357543945]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 4.0, 4.0, 5.0, 5.0, 2.0, 11.0, 7.0, 11.0, 21.0, 13.0, 15.0, 17.0, 26.0, 15.0, 31.0, 32.0, 30.0, 34.0, 39.0, 47.0, 60.0, 72.0, 58.0, 66.0, 29.0, 45.0, 38.0, 33.0, 33.0, 34.0, 23.0, 21.0, 26.0, 14.0, 14.0, 9.0, 6.0, 14.0, 9.0, 8.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.208620548248291, -2.141848087310791, -2.07507586479187, -2.008303642272949, -1.9415311813354492, -1.8747588396072388, -1.8079864978790283, -1.7412141561508179, -1.6744418144226074, -1.607669472694397, -1.5408971309661865, -1.474124789237976, -1.4073524475097656, -1.3405801057815552, -1.2738077640533447, -1.2070354223251343, -1.1402630805969238, -1.0734907388687134, -1.006718397140503, -0.9399460554122925, -0.873173713684082, -0.8064013719558716, -0.7396290302276611, -0.6728566884994507, -0.6060843467712402, -0.5393120050430298, -0.47253966331481934, -0.4057673215866089, -0.33899497985839844, -0.272222638130188, -0.20545029640197754, -0.1386779546737671, -0.07190561294555664, -0.005133271217346191, 0.06163907051086426, 0.1284114122390747, 0.19518375396728516, 0.2619560956954956, 0.32872843742370605, 0.3955007791519165, 0.46227312088012695, 0.5290454626083374, 0.5958178043365479, 0.6625901460647583, 0.7293624877929688, 0.7961348295211792, 0.8629071712493896, 0.9296795129776001, 0.9964518547058105, 1.063224196434021, 1.1299965381622314, 1.196768879890442, 1.2635412216186523, 1.3303135633468628, 1.3970859050750732, 1.4638582468032837, 1.5306305885314941, 1.5974029302597046, 1.664175271987915, 1.7309476137161255, 1.797719955444336, 1.8644922971725464, 1.9312646389007568, 1.9980369806289673, 2.0648093223571777]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 4.0, 9.0, 6.0, 9.0, 15.0, 23.0, 29.0, 38.0, 50.0, 82.0, 154.0, 266.0, 542.0, 1063.0, 3084.0, 18416.0, 2603870.0, 1546105.0, 15625.0, 2811.0, 983.0, 445.0, 274.0, 132.0, 97.0, 48.0, 30.0, 24.0, 23.0, 6.0, 8.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.7431640625, -0.723052978515625, -0.70294189453125, -0.682830810546875, -0.6627197265625, -0.642608642578125, -0.62249755859375, -0.602386474609375, -0.582275390625, -0.562164306640625, -0.54205322265625, -0.521942138671875, -0.5018310546875, -0.481719970703125, -0.46160888671875, -0.441497802734375, -0.42138671875, -0.401275634765625, -0.38116455078125, -0.361053466796875, -0.3409423828125, -0.320831298828125, -0.30072021484375, -0.280609130859375, -0.260498046875, -0.240386962890625, -0.22027587890625, -0.200164794921875, -0.1800537109375, -0.159942626953125, -0.13983154296875, -0.119720458984375, -0.099609375, -0.079498291015625, -0.05938720703125, -0.039276123046875, -0.0191650390625, 0.000946044921875, 0.02105712890625, 0.041168212890625, 0.061279296875, 0.081390380859375, 0.10150146484375, 0.121612548828125, 0.1417236328125, 0.161834716796875, 0.18194580078125, 0.202056884765625, 0.22216796875, 0.242279052734375, 0.26239013671875, 0.282501220703125, 0.3026123046875, 0.322723388671875, 0.34283447265625, 0.362945556640625, 0.383056640625, 0.403167724609375, 0.42327880859375, 0.443389892578125, 0.4635009765625, 0.483612060546875, 0.50372314453125, 0.523834228515625, 0.5439453125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 4.0, 4.0, 5.0, 8.0, 10.0, 15.0, 11.0, 20.0, 23.0, 30.0, 39.0, 46.0, 39.0, 46.0, 50.0, 60.0, 59.0, 53.0, 62.0, 47.0, 44.0, 53.0, 61.0, 34.0, 37.0, 22.0, 34.0, 21.0, 13.0, 13.0, 6.0, 12.0, 8.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.151611328125, -0.1475696563720703, -0.14352798461914062, -0.13948631286621094, -0.13544464111328125, -0.13140296936035156, -0.12736129760742188, -0.12331962585449219, -0.1192779541015625, -0.11523628234863281, -0.11119461059570312, -0.10715293884277344, -0.10311126708984375, -0.09906959533691406, -0.09502792358398438, -0.09098625183105469, -0.086944580078125, -0.08290290832519531, -0.07886123657226562, -0.07481956481933594, -0.07077789306640625, -0.06673622131347656, -0.06269454956054688, -0.05865287780761719, -0.0546112060546875, -0.05056953430175781, -0.046527862548828125, -0.04248619079589844, -0.03844451904296875, -0.03440284729003906, -0.030361175537109375, -0.026319503784179688, -0.02227783203125, -0.018236160278320312, -0.014194488525390625, -0.010152816772460938, -0.00611114501953125, -0.0020694732666015625, 0.001972198486328125, 0.0060138702392578125, 0.0100555419921875, 0.014097213745117188, 0.018138885498046875, 0.022180557250976562, 0.02622222900390625, 0.030263900756835938, 0.034305572509765625, 0.03834724426269531, 0.042388916015625, 0.04643058776855469, 0.050472259521484375, 0.05451393127441406, 0.05855560302734375, 0.06259727478027344, 0.06663894653320312, 0.07068061828613281, 0.0747222900390625, 0.07876396179199219, 0.08280563354492188, 0.08684730529785156, 0.09088897705078125, 0.09493064880371094, 0.09897232055664062, 0.10301399230957031, 0.1070556640625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 2.0, 13.0, 21.0, 23.0, 52.0, 69.0, 118.0, 201.0, 477.0, 1641.0, 11066.0, 3396905.0, 773631.0, 7466.0, 1296.0, 528.0, 235.0, 171.0, 102.0, 84.0, 61.0, 49.0, 20.0, 13.0, 11.0, 8.0, 8.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.060546875, -1.0251007080078125, -0.989654541015625, -0.9542083740234375, -0.91876220703125, -0.8833160400390625, -0.847869873046875, -0.8124237060546875, -0.7769775390625, -0.7415313720703125, -0.706085205078125, -0.6706390380859375, -0.63519287109375, -0.5997467041015625, -0.564300537109375, -0.5288543701171875, -0.493408203125, -0.4579620361328125, -0.422515869140625, -0.3870697021484375, -0.35162353515625, -0.3161773681640625, -0.280731201171875, -0.2452850341796875, -0.2098388671875, -0.1743927001953125, -0.138946533203125, -0.1035003662109375, -0.06805419921875, -0.0326080322265625, 0.002838134765625, 0.0382843017578125, 0.07373046875, 0.1091766357421875, 0.144622802734375, 0.1800689697265625, 0.21551513671875, 0.2509613037109375, 0.286407470703125, 0.3218536376953125, 0.3572998046875, 0.3927459716796875, 0.428192138671875, 0.4636383056640625, 0.49908447265625, 0.5345306396484375, 0.569976806640625, 0.6054229736328125, 0.640869140625, 0.6763153076171875, 0.711761474609375, 0.7472076416015625, 0.78265380859375, 0.8180999755859375, 0.853546142578125, 0.8889923095703125, 0.9244384765625, 0.9598846435546875, 0.995330810546875, 1.0307769775390625, 1.06622314453125, 1.1016693115234375, 1.137115478515625, 1.1725616455078125, 1.2080078125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 8.0, 9.0, 26.0, 38.0, 131.0, 729.0, 2279.0, 633.0, 145.0, 47.0, 25.0, 7.0, 4.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.45068359375, -0.41715240478515625, -0.3836212158203125, -0.35009002685546875, -0.316558837890625, -0.28302764892578125, -0.2494964599609375, -0.21596527099609375, -0.18243408203125, -0.14890289306640625, -0.1153717041015625, -0.08184051513671875, -0.048309326171875, -0.01477813720703125, 0.0187530517578125, 0.05228424072265625, 0.0858154296875, 0.11934661865234375, 0.1528778076171875, 0.18640899658203125, 0.219940185546875, 0.25347137451171875, 0.2870025634765625, 0.32053375244140625, 0.35406494140625, 0.38759613037109375, 0.4211273193359375, 0.45465850830078125, 0.488189697265625, 0.5217208862304688, 0.5552520751953125, 0.5887832641601562, 0.622314453125, 0.6558456420898438, 0.6893768310546875, 0.7229080200195312, 0.756439208984375, 0.7899703979492188, 0.8235015869140625, 0.8570327758789062, 0.89056396484375, 0.9240951538085938, 0.9576263427734375, 0.9911575317382812, 1.024688720703125, 1.0582199096679688, 1.0917510986328125, 1.1252822875976562, 1.1588134765625, 1.1923446655273438, 1.2258758544921875, 1.2594070434570312, 1.292938232421875, 1.3264694213867188, 1.3600006103515625, 1.3935317993164062, 1.42706298828125, 1.4605941772460938, 1.4941253662109375, 1.5276565551757812, 1.561187744140625, 1.5947189331054688, 1.6282501220703125, 1.6617813110351562, 1.6953125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 9.0, 19.0, 80.0, 286.0, 394.0, 147.0, 43.0, 8.0, 11.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.1671433448791504, -2.8513193130493164, -2.5354950428009033, -2.2196710109710693, -1.9038468599319458, -1.5880227088928223, -1.2721986770629883, -0.9563744068145752, -0.6405503749847412, -0.32472625374794006, -0.008902132511138916, 0.30692195892333984, 0.6227461099624634, 0.9385702610015869, 1.254394292831421, 1.570218563079834, 1.886042594909668, 2.201866626739502, 2.517690896987915, 2.833514928817749, 3.149339199066162, 3.465163230895996, 3.78098726272583, 4.096811294555664, 4.412635803222656, 4.72845983505249, 5.044283866882324, 5.360108375549316, 5.67593240737915, 5.991756439208984, 6.307580471038818, 6.623404502868652, 6.9392290115356445, 7.2550530433654785, 7.5708770751953125, 7.886701583862305, 8.20252513885498, 8.518349647521973, 8.834173202514648, 9.14999771118164, 9.465822219848633, 9.781646728515625, 10.0974702835083, 10.413294792175293, 10.729118347167969, 11.044942855834961, 11.360767364501953, 11.676590919494629, 11.992414474487305, 12.308238983154297, 12.624062538146973, 12.939887046813965, 13.25571060180664, 13.571535110473633, 13.887359619140625, 14.2031831741333, 14.519007682800293, 14.834832191467285, 15.150655746459961, 15.466480255126953, 15.782303810119629, 16.098129272460938, 16.413951873779297, 16.72977638244629, 17.04560089111328]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 7.0, 2.0, 11.0, 9.0, 5.0, 12.0, 13.0, 12.0, 22.0, 43.0, 47.0, 50.0, 55.0, 62.0, 63.0, 58.0, 64.0, 75.0, 59.0, 57.0, 54.0, 53.0, 41.0, 35.0, 15.0, 24.0, 16.0, 10.0, 9.0, 8.0, 6.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.956798553466797, -2.854630708694458, -2.752462863922119, -2.6502952575683594, -2.5481274127960205, -2.4459595680236816, -2.3437917232513428, -2.241623878479004, -2.139456033706665, -2.037288188934326, -1.9351204633712769, -1.832952618598938, -1.7307847738265991, -1.6286170482635498, -1.526449203491211, -1.424281358718872, -1.3221136331558228, -1.2199457883834839, -1.1177780628204346, -1.0156102180480957, -0.9134423732757568, -0.8112745881080627, -0.7091068029403687, -0.6069389581680298, -0.5047711730003357, -0.4026033580303192, -0.30043554306030273, -0.19826775789260864, -0.09609994292259216, 0.006067872047424316, 0.10823565721511841, 0.21040350198745728, 0.31257128715515137, 0.41473910212516785, 0.5169069170951843, 0.6190747022628784, 0.7212425470352173, 0.8234103322029114, 0.9255781173706055, 1.0277459621429443, 1.1299138069152832, 1.232081651687622, 1.3342493772506714, 1.4364172220230103, 1.5385850667953491, 1.6407527923583984, 1.7429206371307373, 1.8450884819030762, 1.9472562074661255, 2.049423933029175, 2.1515917778015137, 2.2537596225738525, 2.3559274673461914, 2.4580953121185303, 2.560263156890869, 2.662430763244629, 2.7645986080169678, 2.8667664527893066, 2.9689342975616455, 3.0711021423339844, 3.173269748687744, 3.275437593460083, 3.377605438232422, 3.4797732830047607, 3.5819411277770996]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 3.0, 13.0, 23.0, 30.0, 36.0, 56.0, 89.0, 150.0, 214.0, 313.0, 538.0, 900.0, 1534.0, 2674.0, 5031.0, 9999.0, 20057.0, 43977.0, 95396.0, 196476.0, 277593.0, 202996.0, 100766.0, 45872.0, 21354.0, 10328.0, 5311.0, 2917.0, 1563.0, 894.0, 525.0, 320.0, 213.0, 136.0, 82.0, 64.0, 32.0, 19.0, 21.0, 9.0, 7.0, 9.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1824951171875, -0.1763153076171875, -0.170135498046875, -0.1639556884765625, -0.15777587890625, -0.1515960693359375, -0.145416259765625, -0.1392364501953125, -0.133056640625, -0.1268768310546875, -0.120697021484375, -0.1145172119140625, -0.10833740234375, -0.1021575927734375, -0.095977783203125, -0.0897979736328125, -0.0836181640625, -0.0774383544921875, -0.071258544921875, -0.0650787353515625, -0.05889892578125, -0.0527191162109375, -0.046539306640625, -0.0403594970703125, -0.0341796875, -0.0279998779296875, -0.021820068359375, -0.0156402587890625, -0.00946044921875, -0.0032806396484375, 0.002899169921875, 0.0090789794921875, 0.0152587890625, 0.0214385986328125, 0.027618408203125, 0.0337982177734375, 0.03997802734375, 0.0461578369140625, 0.052337646484375, 0.0585174560546875, 0.064697265625, 0.0708770751953125, 0.077056884765625, 0.0832366943359375, 0.08941650390625, 0.0955963134765625, 0.101776123046875, 0.1079559326171875, 0.1141357421875, 0.1203155517578125, 0.126495361328125, 0.1326751708984375, 0.13885498046875, 0.1450347900390625, 0.151214599609375, 0.1573944091796875, 0.16357421875, 0.1697540283203125, 0.175933837890625, 0.1821136474609375, 0.18829345703125, 0.1944732666015625, 0.200653076171875, 0.2068328857421875, 0.2130126953125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 6.0, 8.0, 7.0, 9.0, 9.0, 8.0, 20.0, 11.0, 18.0, 18.0, 25.0, 36.0, 33.0, 39.0, 45.0, 40.0, 48.0, 38.0, 43.0, 48.0, 45.0, 50.0, 54.0, 50.0, 40.0, 45.0, 29.0, 26.0, 24.0, 15.0, 22.0, 11.0, 15.0, 16.0, 7.0, 8.0, 12.0, 3.0, 3.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.155517578125, -0.1508464813232422, -0.14617538452148438, -0.14150428771972656, -0.13683319091796875, -0.13216209411621094, -0.12749099731445312, -0.12281990051269531, -0.1181488037109375, -0.11347770690917969, -0.10880661010742188, -0.10413551330566406, -0.09946441650390625, -0.09479331970214844, -0.09012222290039062, -0.08545112609863281, -0.080780029296875, -0.07610893249511719, -0.07143783569335938, -0.06676673889160156, -0.06209564208984375, -0.05742454528808594, -0.052753448486328125, -0.04808235168457031, -0.0434112548828125, -0.03874015808105469, -0.034069061279296875, -0.029397964477539062, -0.02472686767578125, -0.020055770874023438, -0.015384674072265625, -0.010713577270507812, -0.00604248046875, -0.0013713836669921875, 0.003299713134765625, 0.007970809936523438, 0.01264190673828125, 0.017313003540039062, 0.021984100341796875, 0.026655197143554688, 0.0313262939453125, 0.03599739074707031, 0.040668487548828125, 0.04533958435058594, 0.05001068115234375, 0.05468177795410156, 0.059352874755859375, 0.06402397155761719, 0.068695068359375, 0.07336616516113281, 0.07803726196289062, 0.08270835876464844, 0.08737945556640625, 0.09205055236816406, 0.09672164916992188, 0.10139274597167969, 0.1060638427734375, 0.11073493957519531, 0.11540603637695312, 0.12007713317871094, 0.12474822998046875, 0.12941932678222656, 0.13409042358398438, 0.1387615203857422, 0.1434326171875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 3.0, 2.0, 5.0, 7.0, 7.0, 17.0, 20.0, 35.0, 50.0, 66.0, 122.0, 243.0, 580.0, 1258.0, 3546.0, 14735.0, 130044.0, 772502.0, 107249.0, 12462.0, 3288.0, 1226.0, 529.0, 247.0, 128.0, 68.0, 31.0, 25.0, 17.0, 11.0, 5.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73291015625, -0.7110061645507812, -0.6891021728515625, -0.6671981811523438, -0.645294189453125, -0.6233901977539062, -0.6014862060546875, -0.5795822143554688, -0.55767822265625, -0.5357742309570312, -0.5138702392578125, -0.49196624755859375, -0.470062255859375, -0.44815826416015625, -0.4262542724609375, -0.40435028076171875, -0.3824462890625, -0.36054229736328125, -0.3386383056640625, -0.31673431396484375, -0.294830322265625, -0.27292633056640625, -0.2510223388671875, -0.22911834716796875, -0.20721435546875, -0.18531036376953125, -0.1634063720703125, -0.14150238037109375, -0.119598388671875, -0.09769439697265625, -0.0757904052734375, -0.05388641357421875, -0.031982421875, -0.01007843017578125, 0.0118255615234375, 0.03372955322265625, 0.055633544921875, 0.07753753662109375, 0.0994415283203125, 0.12134552001953125, 0.14324951171875, 0.16515350341796875, 0.1870574951171875, 0.20896148681640625, 0.230865478515625, 0.25276947021484375, 0.2746734619140625, 0.29657745361328125, 0.3184814453125, 0.34038543701171875, 0.3622894287109375, 0.38419342041015625, 0.406097412109375, 0.42800140380859375, 0.4499053955078125, 0.47180938720703125, 0.49371337890625, 0.5156173706054688, 0.5375213623046875, 0.5594253540039062, 0.581329345703125, 0.6032333374023438, 0.6251373291015625, 0.6470413208007812, 0.6689453125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 5.0, 2.0, 4.0, 3.0, 3.0, 5.0, 10.0, 22.0, 23.0, 25.0, 35.0, 61.0, 61.0, 67.0, 52.0, 83.0, 82.0, 70.0, 56.0, 58.0, 56.0, 53.0, 35.0, 23.0, 37.0, 11.0, 13.0, 14.0, 13.0, 6.0, 5.0, 3.0, 1.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0703125, -1.0378265380859375, -1.005340576171875, -0.9728546142578125, -0.94036865234375, -0.9078826904296875, -0.875396728515625, -0.8429107666015625, -0.8104248046875, -0.7779388427734375, -0.745452880859375, -0.7129669189453125, -0.68048095703125, -0.6479949951171875, -0.615509033203125, -0.5830230712890625, -0.550537109375, -0.5180511474609375, -0.485565185546875, -0.4530792236328125, -0.42059326171875, -0.3881072998046875, -0.355621337890625, -0.3231353759765625, -0.2906494140625, -0.2581634521484375, -0.225677490234375, -0.1931915283203125, -0.16070556640625, -0.1282196044921875, -0.095733642578125, -0.0632476806640625, -0.03076171875, 0.0017242431640625, 0.034210205078125, 0.0666961669921875, 0.09918212890625, 0.1316680908203125, 0.164154052734375, 0.1966400146484375, 0.2291259765625, 0.2616119384765625, 0.294097900390625, 0.3265838623046875, 0.35906982421875, 0.3915557861328125, 0.424041748046875, 0.4565277099609375, 0.489013671875, 0.5214996337890625, 0.553985595703125, 0.5864715576171875, 0.61895751953125, 0.6514434814453125, 0.683929443359375, 0.7164154052734375, 0.7489013671875, 0.7813873291015625, 0.813873291015625, 0.8463592529296875, 0.87884521484375, 0.9113311767578125, 0.943817138671875, 0.9763031005859375, 1.0087890625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 12.0, 15.0, 17.0, 23.0, 33.0, 40.0, 53.0, 76.0, 119.0, 164.0, 263.0, 406.0, 604.0, 921.0, 1516.0, 2516.0, 4523.0, 8530.0, 18312.0, 45101.0, 124288.0, 511087.0, 206232.0, 70308.0, 27203.0, 11868.0, 5855.0, 3278.0, 1857.0, 1117.0, 713.0, 431.0, 343.0, 206.0, 173.0, 75.0, 85.0, 61.0, 39.0, 34.0, 18.0, 12.0, 9.0, 5.0, 4.0, 4.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.1279296875, -0.12389755249023438, -0.11986541748046875, -0.11583328247070312, -0.1118011474609375, -0.10776901245117188, -0.10373687744140625, -0.09970474243164062, -0.095672607421875, -0.09164047241210938, -0.08760833740234375, -0.08357620239257812, -0.0795440673828125, -0.07551193237304688, -0.07147979736328125, -0.06744766235351562, -0.06341552734375, -0.059383392333984375, -0.05535125732421875, -0.051319122314453125, -0.0472869873046875, -0.043254852294921875, -0.03922271728515625, -0.035190582275390625, -0.031158447265625, -0.027126312255859375, -0.02309417724609375, -0.019062042236328125, -0.0150299072265625, -0.010997772216796875, -0.00696563720703125, -0.002933502197265625, 0.0010986328125, 0.005130767822265625, 0.00916290283203125, 0.013195037841796875, 0.0172271728515625, 0.021259307861328125, 0.02529144287109375, 0.029323577880859375, 0.033355712890625, 0.037387847900390625, 0.04141998291015625, 0.045452117919921875, 0.0494842529296875, 0.053516387939453125, 0.05754852294921875, 0.061580657958984375, 0.06561279296875, 0.06964492797851562, 0.07367706298828125, 0.07770919799804688, 0.0817413330078125, 0.08577346801757812, 0.08980560302734375, 0.09383773803710938, 0.097869873046875, 0.10190200805664062, 0.10593414306640625, 0.10996627807617188, 0.1139984130859375, 0.11803054809570312, 0.12206268310546875, 0.12609481811523438, 0.130126953125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 7.0, 13.0, 13.0, 23.0, 45.0, 67.0, 114.0, 197.0, 204.0, 108.0, 72.0, 42.0, 25.0, 23.0, 10.0, 6.0, 8.0, 6.0, 4.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.298324584960938e-05, -8.910149335861206e-05, -8.521974086761475e-05, -8.133798837661743e-05, -7.745623588562012e-05, -7.35744833946228e-05, -6.969273090362549e-05, -6.581097841262817e-05, -6.192922592163086e-05, -5.8047473430633545e-05, -5.416572093963623e-05, -5.0283968448638916e-05, -4.64022159576416e-05, -4.252046346664429e-05, -3.863871097564697e-05, -3.475695848464966e-05, -3.0875205993652344e-05, -2.699345350265503e-05, -2.3111701011657715e-05, -1.92299485206604e-05, -1.5348196029663086e-05, -1.1466443538665771e-05, -7.584691047668457e-06, -3.7029385566711426e-06, 1.7881393432617188e-07, 4.060566425323486e-06, 7.9423189163208e-06, 1.1824071407318115e-05, 1.570582389831543e-05, 1.9587576389312744e-05, 2.346932888031006e-05, 2.7351081371307373e-05, 3.123283386230469e-05, 3.5114586353302e-05, 3.8996338844299316e-05, 4.287809133529663e-05, 4.6759843826293945e-05, 5.064159631729126e-05, 5.4523348808288574e-05, 5.840510129928589e-05, 6.22868537902832e-05, 6.616860628128052e-05, 7.005035877227783e-05, 7.393211126327515e-05, 7.781386375427246e-05, 8.169561624526978e-05, 8.557736873626709e-05, 8.94591212272644e-05, 9.334087371826172e-05, 9.722262620925903e-05, 0.00010110437870025635, 0.00010498613119125366, 0.00010886788368225098, 0.00011274963617324829, 0.0001166313886642456, 0.00012051314115524292, 0.00012439489364624023, 0.00012827664613723755, 0.00013215839862823486, 0.00013604015111923218, 0.0001399219036102295, 0.0001438036561012268, 0.00014768540859222412, 0.00015156716108322144, 0.00015544891357421875]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 10.0, 4.0, 16.0, 18.0, 38.0, 74.0, 101.0, 237.0, 454.0, 947.0, 2068.0, 5106.0, 14883.0, 52185.0, 233718.0, 597034.0, 101584.0, 25946.0, 8316.0, 3181.0, 1284.0, 648.0, 315.0, 152.0, 95.0, 49.0, 37.0, 17.0, 8.0, 10.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.201904296875, -0.19564056396484375, -0.1893768310546875, -0.18311309814453125, -0.176849365234375, -0.17058563232421875, -0.1643218994140625, -0.15805816650390625, -0.15179443359375, -0.14553070068359375, -0.1392669677734375, -0.13300323486328125, -0.126739501953125, -0.12047576904296875, -0.1142120361328125, -0.10794830322265625, -0.1016845703125, -0.09542083740234375, -0.0891571044921875, -0.08289337158203125, -0.076629638671875, -0.07036590576171875, -0.0641021728515625, -0.05783843994140625, -0.05157470703125, -0.04531097412109375, -0.0390472412109375, -0.03278350830078125, -0.026519775390625, -0.02025604248046875, -0.0139923095703125, -0.00772857666015625, -0.00146484375, 0.00479888916015625, 0.0110626220703125, 0.01732635498046875, 0.023590087890625, 0.02985382080078125, 0.0361175537109375, 0.04238128662109375, 0.04864501953125, 0.05490875244140625, 0.0611724853515625, 0.06743621826171875, 0.073699951171875, 0.07996368408203125, 0.0862274169921875, 0.09249114990234375, 0.0987548828125, 0.10501861572265625, 0.1112823486328125, 0.11754608154296875, 0.123809814453125, 0.13007354736328125, 0.1363372802734375, 0.14260101318359375, 0.14886474609375, 0.15512847900390625, 0.1613922119140625, 0.16765594482421875, 0.173919677734375, 0.18018341064453125, 0.1864471435546875, 0.19271087646484375, 0.198974609375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 4.0, 4.0, 8.0, 7.0, 8.0, 14.0, 25.0, 16.0, 29.0, 26.0, 39.0, 56.0, 84.0, 92.0, 104.0, 100.0, 74.0, 87.0, 58.0, 44.0, 31.0, 20.0, 16.0, 16.0, 10.0, 7.0, 6.0, 4.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1798095703125, -0.1728382110595703, -0.16586685180664062, -0.15889549255371094, -0.15192413330078125, -0.14495277404785156, -0.13798141479492188, -0.1310100555419922, -0.1240386962890625, -0.11706733703613281, -0.11009597778320312, -0.10312461853027344, -0.09615325927734375, -0.08918190002441406, -0.08221054077148438, -0.07523918151855469, -0.068267822265625, -0.06129646301269531, -0.054325103759765625, -0.04735374450683594, -0.04038238525390625, -0.03341102600097656, -0.026439666748046875, -0.019468307495117188, -0.0124969482421875, -0.0055255889892578125, 0.001445770263671875, 0.008417129516601562, 0.01538848876953125, 0.022359848022460938, 0.029331207275390625, 0.03630256652832031, 0.04327392578125, 0.05024528503417969, 0.057216644287109375, 0.06418800354003906, 0.07115936279296875, 0.07813072204589844, 0.08510208129882812, 0.09207344055175781, 0.0990447998046875, 0.10601615905761719, 0.11298751831054688, 0.11995887756347656, 0.12693023681640625, 0.13390159606933594, 0.14087295532226562, 0.1478443145751953, 0.154815673828125, 0.1617870330810547, 0.16875839233398438, 0.17572975158691406, 0.18270111083984375, 0.18967247009277344, 0.19664382934570312, 0.2036151885986328, 0.2105865478515625, 0.2175579071044922, 0.22452926635742188, 0.23150062561035156, 0.23847198486328125, 0.24544334411621094, 0.2524147033691406, 0.2593860626220703, 0.266357421875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 4.0, 7.0, 8.0, 3.0, 12.0, 18.0, 35.0, 60.0, 112.0, 190.0, 329.0, 117.0, 59.0, 20.0, 14.0, 7.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.548297882080078, -8.351131439208984, -8.15396499633789, -7.956799030303955, -7.7596330642700195, -7.562466621398926, -7.36530065536499, -7.1681342124938965, -6.970968246459961, -6.773801803588867, -6.576635837554932, -6.379469394683838, -6.182303428649902, -5.985136985778809, -5.787971019744873, -5.590804576873779, -5.393638610839844, -5.19647216796875, -4.9993062019348145, -4.802139759063721, -4.604973793029785, -4.407807350158691, -4.210641384124756, -4.013474941253662, -3.8163084983825684, -3.6191422939300537, -3.421976089477539, -3.2248098850250244, -3.0276436805725098, -2.830477476119995, -2.6333112716674805, -2.4361448287963867, -2.238978862762451, -2.0418126583099365, -1.8446464538574219, -1.6474802494049072, -1.4503140449523926, -1.253147840499878, -1.0559815168380737, -0.8588153123855591, -0.6616491079330444, -0.4644829034805298, -0.26731666922569275, -0.07015043497085571, 0.12701576948165894, 0.3241819739341736, 0.521348237991333, 0.7185144424438477, 0.9156806468963623, 1.112846851348877, 1.3100130558013916, 1.5071792602539062, 1.704345464706421, 1.9015116691589355, 2.0986781120300293, 2.295844078063965, 2.4930105209350586, 2.6901767253875732, 2.887342929840088, 3.0845091342926025, 3.281675338745117, 3.478841543197632, 3.6760077476501465, 3.8731741905212402, 4.070340156555176]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 9.0, 6.0, 14.0, 11.0, 14.0, 23.0, 13.0, 20.0, 25.0, 35.0, 27.0, 36.0, 39.0, 42.0, 61.0, 81.0, 111.0, 76.0, 43.0, 34.0, 36.0, 33.0, 34.0, 26.0, 26.0, 13.0, 18.0, 15.0, 16.0, 13.0, 9.0, 7.0, 9.0, 5.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.6389899253845215, -4.499861240386963, -4.360732555389404, -4.221603870391846, -4.082475185394287, -3.9433465003967285, -3.804217576980591, -3.6650888919830322, -3.5259602069854736, -3.386831521987915, -3.2477028369903564, -3.108574151992798, -2.96944522857666, -2.8303165435791016, -2.691187858581543, -2.5520591735839844, -2.412930488586426, -2.273801803588867, -2.1346731185913086, -1.9955443143844604, -1.8564156293869019, -1.7172869443893433, -1.5781581401824951, -1.4390294551849365, -1.299900770187378, -1.1607720851898193, -1.0216434001922607, -0.8825145959854126, -0.743385910987854, -0.6042572259902954, -0.46512848138809204, -0.32599973678588867, -0.18687152862548828, -0.0477428138256073, 0.09138590097427368, 0.23051461577415466, 0.36964333057403564, 0.5087720155715942, 0.6479007601737976, 0.787029504776001, 0.9261581897735596, 1.0652868747711182, 1.2044155597686768, 1.343544363975525, 1.4826730489730835, 1.621801733970642, 1.7609305381774902, 1.9000592231750488, 2.0391879081726074, 2.178316593170166, 2.3174452781677246, 2.456573963165283, 2.595702648162842, 2.7348313331604004, 2.873960256576538, 3.0130889415740967, 3.1522176265716553, 3.291346311569214, 3.4304749965667725, 3.569603681564331, 3.7087326049804688, 3.8478612899780273, 3.986989974975586, 4.1261186599731445, 4.265247344970703]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 2.0, 4.0, 1.0, 4.0, 6.0, 18.0, 21.0, 26.0, 22.0, 47.0, 90.0, 130.0, 194.0, 307.0, 576.0, 1148.0, 3191.0, 15739.0, 395471.0, 3651427.0, 111934.0, 9243.0, 2383.0, 955.0, 502.0, 237.0, 211.0, 136.0, 72.0, 48.0, 48.0, 25.0, 14.0, 5.0, 13.0, 11.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.68310546875, -0.6652946472167969, -0.6474838256835938, -0.6296730041503906, -0.6118621826171875, -0.5940513610839844, -0.5762405395507812, -0.5584297180175781, -0.540618896484375, -0.5228080749511719, -0.5049972534179688, -0.4871864318847656, -0.4693756103515625, -0.4515647888183594, -0.43375396728515625, -0.4159431457519531, -0.39813232421875, -0.3803215026855469, -0.36251068115234375, -0.3446998596191406, -0.3268890380859375, -0.3090782165527344, -0.29126739501953125, -0.2734565734863281, -0.255645751953125, -0.23783493041992188, -0.22002410888671875, -0.20221328735351562, -0.1844024658203125, -0.16659164428710938, -0.14878082275390625, -0.13097000122070312, -0.1131591796875, -0.09534835815429688, -0.07753753662109375, -0.059726715087890625, -0.0419158935546875, -0.024105072021484375, -0.00629425048828125, 0.011516571044921875, 0.029327392578125, 0.047138214111328125, 0.06494903564453125, 0.08275985717773438, 0.1005706787109375, 0.11838150024414062, 0.13619232177734375, 0.15400314331054688, 0.17181396484375, 0.18962478637695312, 0.20743560791015625, 0.22524642944335938, 0.2430572509765625, 0.2608680725097656, 0.27867889404296875, 0.2964897155761719, 0.314300537109375, 0.3321113586425781, 0.34992218017578125, 0.3677330017089844, 0.3855438232421875, 0.4033546447753906, 0.42116546630859375, 0.4389762878417969, 0.456787109375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 4.0, 2.0, 7.0, 5.0, 13.0, 13.0, 20.0, 21.0, 24.0, 21.0, 45.0, 40.0, 45.0, 36.0, 58.0, 58.0, 64.0, 66.0, 65.0, 62.0, 49.0, 56.0, 34.0, 42.0, 23.0, 33.0, 21.0, 17.0, 10.0, 9.0, 9.0, 6.0, 2.0, 3.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.180419921875, -0.17400741577148438, -0.16759490966796875, -0.16118240356445312, -0.1547698974609375, -0.14835739135742188, -0.14194488525390625, -0.13553237915039062, -0.129119873046875, -0.12270736694335938, -0.11629486083984375, -0.10988235473632812, -0.1034698486328125, -0.09705734252929688, -0.09064483642578125, -0.08423233032226562, -0.07781982421875, -0.07140731811523438, -0.06499481201171875, -0.058582305908203125, -0.0521697998046875, -0.045757293701171875, -0.03934478759765625, -0.032932281494140625, -0.026519775390625, -0.020107269287109375, -0.01369476318359375, -0.007282257080078125, -0.0008697509765625, 0.005542755126953125, 0.01195526123046875, 0.018367767333984375, 0.0247802734375, 0.031192779541015625, 0.03760528564453125, 0.044017791748046875, 0.0504302978515625, 0.056842803955078125, 0.06325531005859375, 0.06966781616210938, 0.076080322265625, 0.08249282836914062, 0.08890533447265625, 0.09531784057617188, 0.1017303466796875, 0.10814285278320312, 0.11455535888671875, 0.12096786499023438, 0.12738037109375, 0.13379287719726562, 0.14020538330078125, 0.14661788940429688, 0.1530303955078125, 0.15944290161132812, 0.16585540771484375, 0.17226791381835938, 0.178680419921875, 0.18509292602539062, 0.19150543212890625, 0.19791793823242188, 0.2043304443359375, 0.21074295043945312, 0.21715545654296875, 0.22356796264648438, 0.22998046875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 2.0, 6.0, 3.0, 12.0, 13.0, 15.0, 49.0, 92.0, 190.0, 387.0, 1148.0, 6102.0, 559286.0, 3613183.0, 11404.0, 1549.0, 476.0, 185.0, 90.0, 34.0, 24.0, 21.0, 8.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2529296875, -1.2113189697265625, -1.169708251953125, -1.1280975341796875, -1.08648681640625, -1.0448760986328125, -1.003265380859375, -0.9616546630859375, -0.9200439453125, -0.8784332275390625, -0.836822509765625, -0.7952117919921875, -0.75360107421875, -0.7119903564453125, -0.670379638671875, -0.6287689208984375, -0.587158203125, -0.5455474853515625, -0.503936767578125, -0.4623260498046875, -0.42071533203125, -0.3791046142578125, -0.337493896484375, -0.2958831787109375, -0.2542724609375, -0.2126617431640625, -0.171051025390625, -0.1294403076171875, -0.08782958984375, -0.0462188720703125, -0.004608154296875, 0.0370025634765625, 0.07861328125, 0.1202239990234375, 0.161834716796875, 0.2034454345703125, 0.24505615234375, 0.2866668701171875, 0.328277587890625, 0.3698883056640625, 0.4114990234375, 0.4531097412109375, 0.494720458984375, 0.5363311767578125, 0.57794189453125, 0.6195526123046875, 0.661163330078125, 0.7027740478515625, 0.744384765625, 0.7859954833984375, 0.827606201171875, 0.8692169189453125, 0.91082763671875, 0.9524383544921875, 0.994049072265625, 1.0356597900390625, 1.0772705078125, 1.1188812255859375, 1.160491943359375, 1.2021026611328125, 1.24371337890625, 1.2853240966796875, 1.326934814453125, 1.3685455322265625, 1.41015625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 5.0, 5.0, 8.0, 17.0, 15.0, 23.0, 40.0, 78.0, 166.0, 336.0, 725.0, 1114.0, 788.0, 354.0, 172.0, 84.0, 46.0, 29.0, 25.0, 15.0, 11.0, 4.0, 11.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.62939453125, -0.611175537109375, -0.59295654296875, -0.574737548828125, -0.5565185546875, -0.538299560546875, -0.52008056640625, -0.501861572265625, -0.483642578125, -0.465423583984375, -0.44720458984375, -0.428985595703125, -0.4107666015625, -0.392547607421875, -0.37432861328125, -0.356109619140625, -0.337890625, -0.319671630859375, -0.30145263671875, -0.283233642578125, -0.2650146484375, -0.246795654296875, -0.22857666015625, -0.210357666015625, -0.192138671875, -0.173919677734375, -0.15570068359375, -0.137481689453125, -0.1192626953125, -0.101043701171875, -0.08282470703125, -0.064605712890625, -0.04638671875, -0.028167724609375, -0.00994873046875, 0.008270263671875, 0.0264892578125, 0.044708251953125, 0.06292724609375, 0.081146240234375, 0.099365234375, 0.117584228515625, 0.13580322265625, 0.154022216796875, 0.1722412109375, 0.190460205078125, 0.20867919921875, 0.226898193359375, 0.2451171875, 0.263336181640625, 0.28155517578125, 0.299774169921875, 0.3179931640625, 0.336212158203125, 0.35443115234375, 0.372650146484375, 0.390869140625, 0.409088134765625, 0.42730712890625, 0.445526123046875, 0.4637451171875, 0.481964111328125, 0.50018310546875, 0.518402099609375, 0.53662109375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 6.0, 16.0, 33.0, 89.0, 187.0, 248.0, 197.0, 106.0, 56.0, 29.0, 14.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.91811752319336, -8.7090482711792, -8.499978065490723, -8.290908813476562, -8.081838607788086, -7.872769355773926, -7.663699626922607, -7.454629898071289, -7.245560646057129, -7.0364909172058105, -6.827421188354492, -6.618351936340332, -6.409282207489014, -6.200212478637695, -5.991142749786377, -5.782073020935059, -5.57300329208374, -5.363933563232422, -5.1548638343811035, -4.945794105529785, -4.736724853515625, -4.527655124664307, -4.318585395812988, -4.10951566696167, -3.9004461765289307, -3.6913764476776123, -3.482306957244873, -3.2732372283935547, -3.0641674995422363, -2.855098009109497, -2.6460282802581787, -2.4369587898254395, -2.2278895378112793, -2.018819808959961, -1.8097503185272217, -1.6006805896759033, -1.3916109800338745, -1.1825413703918457, -0.9734716415405273, -0.7644020318984985, -0.5553324222564697, -0.34626278281211853, -0.13719314336776733, 0.07187652587890625, 0.28094613552093506, 0.49001574516296387, 0.6990854740142822, 0.908155083656311, 1.1172246932983398, 1.3262943029403687, 1.5353639125823975, 1.7444336414337158, 1.9535032510757446, 2.1625728607177734, 2.371642589569092, 2.58071231842041, 2.7897818088531494, 2.9988515377044678, 3.207921028137207, 3.4169907569885254, 3.6260604858398438, 3.835129976272583, 4.0441999435424805, 4.253269195556641, 4.462338924407959]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 8.0, 5.0, 4.0, 4.0, 4.0, 15.0, 12.0, 13.0, 19.0, 18.0, 21.0, 28.0, 32.0, 25.0, 34.0, 29.0, 42.0, 47.0, 44.0, 32.0, 40.0, 33.0, 54.0, 45.0, 39.0, 35.0, 30.0, 30.0, 46.0, 26.0, 31.0, 24.0, 21.0, 21.0, 19.0, 13.0, 13.0, 5.0, 8.0, 6.0, 7.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5522117614746094, -1.4958521127700806, -1.4394924640655518, -1.383132815361023, -1.3267731666564941, -1.2704136371612549, -1.214053988456726, -1.1576943397521973, -1.1013346910476685, -1.0449750423431396, -0.9886153936386108, -0.9322558045387268, -0.875896155834198, -0.8195365071296692, -0.7631769180297852, -0.7068172693252563, -0.6504576206207275, -0.5940979719161987, -0.5377383232116699, -0.4813787341117859, -0.4250190854072571, -0.36865943670272827, -0.31229981780052185, -0.25594019889831543, -0.19958055019378662, -0.143220916390419, -0.08686128258705139, -0.030501648783683777, 0.025857985019683838, 0.08221763372421265, 0.13857725262641907, 0.1949368715286255, 0.2512965202331543, 0.3076561689376831, 0.3640157878398895, 0.42037540674209595, 0.47673505544662476, 0.5330947041511536, 0.5894542932510376, 0.6458139419555664, 0.7021735906600952, 0.758533239364624, 0.8148928880691528, 0.8712524771690369, 0.9276121258735657, 0.9839717745780945, 1.0403313636779785, 1.0966910123825073, 1.1530506610870361, 1.209410309791565, 1.2657699584960938, 1.3221296072006226, 1.3784892559051514, 1.4348487854003906, 1.4912084341049194, 1.5475680828094482, 1.603927731513977, 1.6602873802185059, 1.7166470289230347, 1.7730066776275635, 1.8293662071228027, 1.885725975036621, 1.9420855045318604, 1.9984451532363892, 2.054804801940918]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 5.0, 6.0, 14.0, 18.0, 32.0, 41.0, 60.0, 94.0, 138.0, 264.0, 425.0, 691.0, 1287.0, 2424.0, 4397.0, 8369.0, 16706.0, 33816.0, 72163.0, 152163.0, 268140.0, 242704.0, 127009.0, 59805.0, 28312.0, 13904.0, 7099.0, 3689.0, 2033.0, 1107.0, 638.0, 396.0, 216.0, 131.0, 104.0, 56.0, 32.0, 24.0, 13.0, 13.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2132568359375, -0.2067699432373047, -0.20028305053710938, -0.19379615783691406, -0.18730926513671875, -0.18082237243652344, -0.17433547973632812, -0.1678485870361328, -0.1613616943359375, -0.1548748016357422, -0.14838790893554688, -0.14190101623535156, -0.13541412353515625, -0.12892723083496094, -0.12244033813476562, -0.11595344543457031, -0.109466552734375, -0.10297966003417969, -0.09649276733398438, -0.09000587463378906, -0.08351898193359375, -0.07703208923339844, -0.07054519653320312, -0.06405830383300781, -0.0575714111328125, -0.05108451843261719, -0.044597625732421875, -0.03811073303222656, -0.03162384033203125, -0.025136947631835938, -0.018650054931640625, -0.012163162231445312, -0.00567626953125, 0.0008106231689453125, 0.007297515869140625, 0.013784408569335938, 0.02027130126953125, 0.026758193969726562, 0.033245086669921875, 0.03973197937011719, 0.0462188720703125, 0.05270576477050781, 0.059192657470703125, 0.06567955017089844, 0.07216644287109375, 0.07865333557128906, 0.08514022827148438, 0.09162712097167969, 0.098114013671875, 0.10460090637207031, 0.11108779907226562, 0.11757469177246094, 0.12406158447265625, 0.13054847717285156, 0.13703536987304688, 0.1435222625732422, 0.1500091552734375, 0.1564960479736328, 0.16298294067382812, 0.16946983337402344, 0.17595672607421875, 0.18244361877441406, 0.18893051147460938, 0.1954174041748047, 0.201904296875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 5.0, 2.0, 9.0, 2.0, 8.0, 11.0, 8.0, 18.0, 8.0, 19.0, 20.0, 25.0, 29.0, 22.0, 40.0, 49.0, 60.0, 37.0, 52.0, 48.0, 57.0, 39.0, 50.0, 47.0, 49.0, 38.0, 37.0, 33.0, 36.0, 28.0, 21.0, 22.0, 15.0, 8.0, 12.0, 6.0, 7.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2037353515625, -0.1976165771484375, -0.191497802734375, -0.1853790283203125, -0.17926025390625, -0.1731414794921875, -0.167022705078125, -0.1609039306640625, -0.15478515625, -0.1486663818359375, -0.142547607421875, -0.1364288330078125, -0.13031005859375, -0.1241912841796875, -0.118072509765625, -0.1119537353515625, -0.1058349609375, -0.0997161865234375, -0.093597412109375, -0.0874786376953125, -0.08135986328125, -0.0752410888671875, -0.069122314453125, -0.0630035400390625, -0.056884765625, -0.0507659912109375, -0.044647216796875, -0.0385284423828125, -0.03240966796875, -0.0262908935546875, -0.020172119140625, -0.0140533447265625, -0.0079345703125, -0.0018157958984375, 0.004302978515625, 0.0104217529296875, 0.01654052734375, 0.0226593017578125, 0.028778076171875, 0.0348968505859375, 0.041015625, 0.0471343994140625, 0.053253173828125, 0.0593719482421875, 0.06549072265625, 0.0716094970703125, 0.077728271484375, 0.0838470458984375, 0.0899658203125, 0.0960845947265625, 0.102203369140625, 0.1083221435546875, 0.11444091796875, 0.1205596923828125, 0.126678466796875, 0.1327972412109375, 0.138916015625, 0.1450347900390625, 0.151153564453125, 0.1572723388671875, 0.16339111328125, 0.1695098876953125, 0.175628662109375, 0.1817474365234375, 0.1878662109375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 3.0, 7.0, 10.0, 8.0, 11.0, 21.0, 24.0, 35.0, 60.0, 91.0, 165.0, 268.0, 613.0, 1247.0, 3519.0, 15864.0, 142936.0, 787803.0, 80453.0, 10605.0, 2607.0, 979.0, 504.0, 244.0, 170.0, 111.0, 61.0, 35.0, 18.0, 17.0, 19.0, 12.0, 11.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69091796875, -0.6674041748046875, -0.643890380859375, -0.6203765869140625, -0.59686279296875, -0.5733489990234375, -0.549835205078125, -0.5263214111328125, -0.5028076171875, -0.4792938232421875, -0.455780029296875, -0.4322662353515625, -0.40875244140625, -0.3852386474609375, -0.361724853515625, -0.3382110595703125, -0.314697265625, -0.2911834716796875, -0.267669677734375, -0.2441558837890625, -0.22064208984375, -0.1971282958984375, -0.173614501953125, -0.1501007080078125, -0.1265869140625, -0.1030731201171875, -0.079559326171875, -0.0560455322265625, -0.03253173828125, -0.0090179443359375, 0.014495849609375, 0.0380096435546875, 0.0615234375, 0.0850372314453125, 0.108551025390625, 0.1320648193359375, 0.15557861328125, 0.1790924072265625, 0.202606201171875, 0.2261199951171875, 0.2496337890625, 0.2731475830078125, 0.296661376953125, 0.3201751708984375, 0.34368896484375, 0.3672027587890625, 0.390716552734375, 0.4142303466796875, 0.437744140625, 0.4612579345703125, 0.484771728515625, 0.5082855224609375, 0.53179931640625, 0.5553131103515625, 0.578826904296875, 0.6023406982421875, 0.6258544921875, 0.6493682861328125, 0.672882080078125, 0.6963958740234375, 0.71990966796875, 0.7434234619140625, 0.766937255859375, 0.7904510498046875, 0.81396484375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 5.0, 15.0, 9.0, 17.0, 20.0, 38.0, 43.0, 44.0, 55.0, 62.0, 71.0, 71.0, 67.0, 93.0, 67.0, 68.0, 66.0, 43.0, 34.0, 20.0, 22.0, 12.0, 14.0, 12.0, 9.0, 9.0, 3.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.28125, -1.2443389892578125, -1.207427978515625, -1.1705169677734375, -1.13360595703125, -1.0966949462890625, -1.059783935546875, -1.0228729248046875, -0.9859619140625, -0.9490509033203125, -0.912139892578125, -0.8752288818359375, -0.83831787109375, -0.8014068603515625, -0.764495849609375, -0.7275848388671875, -0.690673828125, -0.6537628173828125, -0.616851806640625, -0.5799407958984375, -0.54302978515625, -0.5061187744140625, -0.469207763671875, -0.4322967529296875, -0.3953857421875, -0.3584747314453125, -0.321563720703125, -0.2846527099609375, -0.24774169921875, -0.2108306884765625, -0.173919677734375, -0.1370086669921875, -0.10009765625, -0.0631866455078125, -0.026275634765625, 0.0106353759765625, 0.04754638671875, 0.0844573974609375, 0.121368408203125, 0.1582794189453125, 0.1951904296875, 0.2321014404296875, 0.269012451171875, 0.3059234619140625, 0.34283447265625, 0.3797454833984375, 0.416656494140625, 0.4535675048828125, 0.490478515625, 0.5273895263671875, 0.564300537109375, 0.6012115478515625, 0.63812255859375, 0.6750335693359375, 0.711944580078125, 0.7488555908203125, 0.7857666015625, 0.8226776123046875, 0.859588623046875, 0.8964996337890625, 0.93341064453125, 0.9703216552734375, 1.007232666015625, 1.0441436767578125, 1.0810546875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 4.0, 8.0, 13.0, 14.0, 31.0, 44.0, 79.0, 104.0, 226.0, 540.0, 1367.0, 4611.0, 22044.0, 179096.0, 768562.0, 58013.0, 9825.0, 2369.0, 847.0, 315.0, 169.0, 97.0, 65.0, 37.0, 24.0, 18.0, 17.0, 8.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.281005859375, -0.27140045166015625, -0.2617950439453125, -0.25218963623046875, -0.242584228515625, -0.23297882080078125, -0.2233734130859375, -0.21376800537109375, -0.20416259765625, -0.19455718994140625, -0.1849517822265625, -0.17534637451171875, -0.165740966796875, -0.15613555908203125, -0.1465301513671875, -0.13692474365234375, -0.1273193359375, -0.11771392822265625, -0.1081085205078125, -0.09850311279296875, -0.088897705078125, -0.07929229736328125, -0.0696868896484375, -0.06008148193359375, -0.05047607421875, -0.04087066650390625, -0.0312652587890625, -0.02165985107421875, -0.012054443359375, -0.00244903564453125, 0.0071563720703125, 0.01676177978515625, 0.0263671875, 0.03597259521484375, 0.0455780029296875, 0.05518341064453125, 0.064788818359375, 0.07439422607421875, 0.0839996337890625, 0.09360504150390625, 0.10321044921875, 0.11281585693359375, 0.1224212646484375, 0.13202667236328125, 0.141632080078125, 0.15123748779296875, 0.1608428955078125, 0.17044830322265625, 0.1800537109375, 0.18965911865234375, 0.1992645263671875, 0.20886993408203125, 0.218475341796875, 0.22808074951171875, 0.2376861572265625, 0.24729156494140625, 0.25689697265625, 0.26650238037109375, 0.2761077880859375, 0.28571319580078125, 0.295318603515625, 0.30492401123046875, 0.3145294189453125, 0.32413482666015625, 0.333740234375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 13.0, 22.0, 19.0, 40.0, 47.0, 79.0, 142.0, 192.0, 167.0, 96.0, 56.0, 31.0, 31.0, 13.0, 7.0, 6.0, 7.0, 8.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010383129119873047, -0.00010006874799728394, -9.63062047958374e-05, -9.254366159439087e-05, -8.878111839294434e-05, -8.50185751914978e-05, -8.125603199005127e-05, -7.749348878860474e-05, -7.37309455871582e-05, -6.996840238571167e-05, -6.620585918426514e-05, -6.24433159828186e-05, -5.868077278137207e-05, -5.491822957992554e-05, -5.1155686378479004e-05, -4.739314317703247e-05, -4.363059997558594e-05, -3.9868056774139404e-05, -3.610551357269287e-05, -3.234297037124634e-05, -2.8580427169799805e-05, -2.481788396835327e-05, -2.1055340766906738e-05, -1.7292797565460205e-05, -1.3530254364013672e-05, -9.767711162567139e-06, -6.0051679611206055e-06, -2.2426247596740723e-06, 1.519918441772461e-06, 5.282461643218994e-06, 9.045004844665527e-06, 1.280754804611206e-05, 1.6570091247558594e-05, 2.0332634449005127e-05, 2.409517765045166e-05, 2.7857720851898193e-05, 3.1620264053344727e-05, 3.538280725479126e-05, 3.914535045623779e-05, 4.2907893657684326e-05, 4.667043685913086e-05, 5.043298006057739e-05, 5.4195523262023926e-05, 5.795806646347046e-05, 6.172060966491699e-05, 6.548315286636353e-05, 6.924569606781006e-05, 7.300823926925659e-05, 7.677078247070312e-05, 8.053332567214966e-05, 8.429586887359619e-05, 8.805841207504272e-05, 9.182095527648926e-05, 9.558349847793579e-05, 9.934604167938232e-05, 0.00010310858488082886, 0.00010687112808227539, 0.00011063367128372192, 0.00011439621448516846, 0.00011815875768661499, 0.00012192130088806152, 0.00012568384408950806, 0.0001294463872909546, 0.00013320893049240112, 0.00013697147369384766]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 13.0, 9.0, 14.0, 21.0, 17.0, 39.0, 56.0, 94.0, 134.0, 244.0, 417.0, 726.0, 1491.0, 3990.0, 12467.0, 54129.0, 588635.0, 321818.0, 46519.0, 10987.0, 3525.0, 1520.0, 708.0, 380.0, 196.0, 127.0, 83.0, 45.0, 42.0, 31.0, 8.0, 12.0, 18.0, 12.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.26416015625, -0.25681304931640625, -0.2494659423828125, -0.24211883544921875, -0.234771728515625, -0.22742462158203125, -0.2200775146484375, -0.21273040771484375, -0.20538330078125, -0.19803619384765625, -0.1906890869140625, -0.18334197998046875, -0.175994873046875, -0.16864776611328125, -0.1613006591796875, -0.15395355224609375, -0.1466064453125, -0.13925933837890625, -0.1319122314453125, -0.12456512451171875, -0.117218017578125, -0.10987091064453125, -0.1025238037109375, -0.09517669677734375, -0.08782958984375, -0.08048248291015625, -0.0731353759765625, -0.06578826904296875, -0.058441162109375, -0.05109405517578125, -0.0437469482421875, -0.03639984130859375, -0.029052734375, -0.02170562744140625, -0.0143585205078125, -0.00701141357421875, 0.000335693359375, 0.00768280029296875, 0.0150299072265625, 0.02237701416015625, 0.02972412109375, 0.03707122802734375, 0.0444183349609375, 0.05176544189453125, 0.059112548828125, 0.06645965576171875, 0.0738067626953125, 0.08115386962890625, 0.0885009765625, 0.09584808349609375, 0.1031951904296875, 0.11054229736328125, 0.117889404296875, 0.12523651123046875, 0.1325836181640625, 0.13993072509765625, 0.14727783203125, 0.15462493896484375, 0.1619720458984375, 0.16931915283203125, 0.176666259765625, 0.18401336669921875, 0.1913604736328125, 0.19870758056640625, 0.2060546875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 1.0, 10.0, 12.0, 17.0, 28.0, 33.0, 59.0, 61.0, 95.0, 101.0, 132.0, 109.0, 92.0, 82.0, 48.0, 28.0, 25.0, 24.0, 8.0, 10.0, 5.0, 6.0, 2.0, 0.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.23291015625, -0.22478485107421875, -0.2166595458984375, -0.20853424072265625, -0.200408935546875, -0.19228363037109375, -0.1841583251953125, -0.17603302001953125, -0.16790771484375, -0.15978240966796875, -0.1516571044921875, -0.14353179931640625, -0.135406494140625, -0.12728118896484375, -0.1191558837890625, -0.11103057861328125, -0.1029052734375, -0.09477996826171875, -0.0866546630859375, -0.07852935791015625, -0.070404052734375, -0.06227874755859375, -0.0541534423828125, -0.04602813720703125, -0.03790283203125, -0.02977752685546875, -0.0216522216796875, -0.01352691650390625, -0.005401611328125, 0.00272369384765625, 0.0108489990234375, 0.01897430419921875, 0.027099609375, 0.03522491455078125, 0.0433502197265625, 0.05147552490234375, 0.059600830078125, 0.06772613525390625, 0.0758514404296875, 0.08397674560546875, 0.09210205078125, 0.10022735595703125, 0.1083526611328125, 0.11647796630859375, 0.124603271484375, 0.13272857666015625, 0.1408538818359375, 0.14897918701171875, 0.1571044921875, 0.16522979736328125, 0.1733551025390625, 0.18148040771484375, 0.189605712890625, 0.19773101806640625, 0.2058563232421875, 0.21398162841796875, 0.22210693359375, 0.23023223876953125, 0.2383575439453125, 0.24648284912109375, 0.254608154296875, 0.26273345947265625, 0.2708587646484375, 0.27898406982421875, 0.287109375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 11.0, 23.0, 41.0, 86.0, 152.0, 334.0, 149.0, 93.0, 54.0, 27.0, 8.0, 8.0, 5.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.079084396362305, -5.908647060394287, -5.7382097244262695, -5.56777286529541, -5.397335529327393, -5.226898193359375, -5.056460857391357, -4.88602352142334, -4.7155866622924805, -4.545149326324463, -4.374711990356445, -4.204275131225586, -4.033837795257568, -3.863400459289551, -3.692963123321533, -3.5225257873535156, -3.352088451385498, -3.1816511154174805, -3.011214017868042, -2.8407766819000244, -2.670339584350586, -2.4999022483825684, -2.329464912414551, -2.159027576446533, -1.9885904788970947, -1.8181532621383667, -1.6477160453796387, -1.477278709411621, -1.306841492652893, -1.136404275894165, -0.9659669399261475, -0.7955297231674194, -0.6250920295715332, -0.4546547830104828, -0.2842175364494324, -0.11378026008605957, 0.05665695667266846, 0.22709417343139648, 0.39753150939941406, 0.5679687261581421, 0.7384059429168701, 0.9088431596755981, 1.0792803764343262, 1.2497177124023438, 1.4201549291610718, 1.5905921459197998, 1.7610294818878174, 1.9314666986465454, 2.1019039154052734, 2.272341251373291, 2.4427783489227295, 2.613215684890747, 2.7836527824401855, 2.954090118408203, 3.1245274543762207, 3.2949647903442383, 3.4654018878936768, 3.6358392238616943, 3.806276321411133, 3.9767136573791504, 4.147150993347168, 4.317587852478027, 4.488025665283203, 4.6584625244140625, 4.82889986038208]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 8.0, 9.0, 7.0, 13.0, 10.0, 17.0, 18.0, 10.0, 29.0, 23.0, 26.0, 23.0, 33.0, 42.0, 41.0, 48.0, 63.0, 123.0, 99.0, 51.0, 44.0, 41.0, 32.0, 23.0, 21.0, 26.0, 18.0, 22.0, 12.0, 18.0, 7.0, 7.0, 14.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0], "bins": [-4.281179428100586, -4.153486728668213, -4.02579402923584, -3.898101568222046, -3.770409107208252, -3.642716407775879, -3.515023708343506, -3.387331008911133, -3.259638547897339, -3.131945848464966, -3.004253387451172, -2.876560688018799, -2.748867988586426, -2.621175527572632, -2.493482828140259, -2.365790367126465, -2.238097667694092, -2.1104049682617188, -1.9827125072479248, -1.8550198078155518, -1.7273272275924683, -1.5996346473693848, -1.4719419479370117, -1.3442493677139282, -1.2165567874908447, -1.0888642072677612, -0.961171567440033, -0.8334789276123047, -0.7057863473892212, -0.5780937671661377, -0.4504011273384094, -0.32270848751068115, -0.19501638412475586, -0.06732377409934998, 0.06036883592605591, 0.1880614459514618, 0.3157540559768677, 0.44344663619995117, 0.5711392760276794, 0.6988319158554077, 0.8265244960784912, 0.9542170763015747, 1.0819096565246582, 1.2096023559570312, 1.3372949361801147, 1.4649875164031982, 1.5926802158355713, 1.7203727960586548, 1.8480653762817383, 1.9757579565048218, 2.1034505367279053, 2.2311432361602783, 2.3588356971740723, 2.4865283966064453, 2.6142210960388184, 2.7419137954711914, 2.8696062564849854, 2.9972989559173584, 3.1249914169311523, 3.2526841163635254, 3.3803768157958984, 3.5080692768096924, 3.6357619762420654, 3.7634544372558594, 3.8911471366882324]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 14.0, 12.0, 17.0, 26.0, 42.0, 48.0, 73.0, 100.0, 133.0, 233.0, 315.0, 495.0, 792.0, 1360.0, 2782.0, 6520.0, 24877.0, 519973.0, 3422504.0, 186781.0, 16557.0, 5123.0, 2344.0, 1150.0, 706.0, 439.0, 285.0, 195.0, 105.0, 86.0, 46.0, 43.0, 25.0, 21.0, 10.0, 16.0, 6.0, 1.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.57958984375, -0.5636520385742188, -0.5477142333984375, -0.5317764282226562, -0.515838623046875, -0.49990081787109375, -0.4839630126953125, -0.46802520751953125, -0.45208740234375, -0.43614959716796875, -0.4202117919921875, -0.40427398681640625, -0.388336181640625, -0.37239837646484375, -0.3564605712890625, -0.34052276611328125, -0.3245849609375, -0.30864715576171875, -0.2927093505859375, -0.27677154541015625, -0.260833740234375, -0.24489593505859375, -0.2289581298828125, -0.21302032470703125, -0.19708251953125, -0.18114471435546875, -0.1652069091796875, -0.14926910400390625, -0.133331298828125, -0.11739349365234375, -0.1014556884765625, -0.08551788330078125, -0.069580078125, -0.05364227294921875, -0.0377044677734375, -0.02176666259765625, -0.005828857421875, 0.01010894775390625, 0.0260467529296875, 0.04198455810546875, 0.05792236328125, 0.07386016845703125, 0.0897979736328125, 0.10573577880859375, 0.121673583984375, 0.13761138916015625, 0.1535491943359375, 0.16948699951171875, 0.1854248046875, 0.20136260986328125, 0.2173004150390625, 0.23323822021484375, 0.249176025390625, 0.26511383056640625, 0.2810516357421875, 0.29698944091796875, 0.31292724609375, 0.32886505126953125, 0.3448028564453125, 0.36074066162109375, 0.376678466796875, 0.39261627197265625, 0.4085540771484375, 0.42449188232421875, 0.4404296875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 9.0, 1.0, 4.0, 4.0, 8.0, 9.0, 5.0, 9.0, 13.0, 17.0, 13.0, 25.0, 22.0, 21.0, 30.0, 44.0, 36.0, 51.0, 32.0, 50.0, 52.0, 45.0, 56.0, 52.0, 38.0, 36.0, 55.0, 48.0, 34.0, 36.0, 24.0, 22.0, 26.0, 19.0, 19.0, 8.0, 10.0, 7.0, 4.0, 6.0, 4.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1849365234375, -0.1794719696044922, -0.17400741577148438, -0.16854286193847656, -0.16307830810546875, -0.15761375427246094, -0.15214920043945312, -0.1466846466064453, -0.1412200927734375, -0.1357555389404297, -0.13029098510742188, -0.12482643127441406, -0.11936187744140625, -0.11389732360839844, -0.10843276977539062, -0.10296821594238281, -0.097503662109375, -0.09203910827636719, -0.08657455444335938, -0.08111000061035156, -0.07564544677734375, -0.07018089294433594, -0.06471633911132812, -0.05925178527832031, -0.0537872314453125, -0.04832267761230469, -0.042858123779296875, -0.03739356994628906, -0.03192901611328125, -0.026464462280273438, -0.020999908447265625, -0.015535354614257812, -0.01007080078125, -0.0046062469482421875, 0.000858306884765625, 0.0063228607177734375, 0.01178741455078125, 0.017251968383789062, 0.022716522216796875, 0.028181076049804688, 0.0336456298828125, 0.03911018371582031, 0.044574737548828125, 0.05003929138183594, 0.05550384521484375, 0.06096839904785156, 0.06643295288085938, 0.07189750671386719, 0.077362060546875, 0.08282661437988281, 0.08829116821289062, 0.09375572204589844, 0.09922027587890625, 0.10468482971191406, 0.11014938354492188, 0.11561393737792969, 0.1210784912109375, 0.1265430450439453, 0.13200759887695312, 0.13747215270996094, 0.14293670654296875, 0.14840126037597656, 0.15386581420898438, 0.1593303680419922, 0.164794921875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 4.0, 6.0, 6.0, 12.0, 19.0, 27.0, 69.0, 146.0, 379.0, 1290.0, 8075.0, 1372931.0, 2799767.0, 9103.0, 1546.0, 506.0, 193.0, 101.0, 42.0, 27.0, 8.0, 11.0, 2.0, 7.0, 7.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.98046875, -1.9322052001953125, -1.883941650390625, -1.8356781005859375, -1.78741455078125, -1.7391510009765625, -1.690887451171875, -1.6426239013671875, -1.5943603515625, -1.5460968017578125, -1.497833251953125, -1.4495697021484375, -1.40130615234375, -1.3530426025390625, -1.304779052734375, -1.2565155029296875, -1.208251953125, -1.1599884033203125, -1.111724853515625, -1.0634613037109375, -1.01519775390625, -0.9669342041015625, -0.918670654296875, -0.8704071044921875, -0.8221435546875, -0.7738800048828125, -0.725616455078125, -0.6773529052734375, -0.62908935546875, -0.5808258056640625, -0.532562255859375, -0.4842987060546875, -0.43603515625, -0.3877716064453125, -0.339508056640625, -0.2912445068359375, -0.24298095703125, -0.1947174072265625, -0.146453857421875, -0.0981903076171875, -0.0499267578125, -0.0016632080078125, 0.046600341796875, 0.0948638916015625, 0.14312744140625, 0.1913909912109375, 0.239654541015625, 0.2879180908203125, 0.336181640625, 0.3844451904296875, 0.432708740234375, 0.4809722900390625, 0.52923583984375, 0.5774993896484375, 0.625762939453125, 0.6740264892578125, 0.7222900390625, 0.7705535888671875, 0.818817138671875, 0.8670806884765625, 0.91534423828125, 0.9636077880859375, 1.011871337890625, 1.0601348876953125, 1.1083984375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 4.0, 9.0, 7.0, 12.0, 20.0, 29.0, 54.0, 79.0, 161.0, 359.0, 861.0, 1127.0, 701.0, 313.0, 149.0, 71.0, 46.0, 21.0, 11.0, 11.0, 9.0, 4.0, 3.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67724609375, -0.6541595458984375, -0.631072998046875, -0.6079864501953125, -0.58489990234375, -0.5618133544921875, -0.538726806640625, -0.5156402587890625, -0.4925537109375, -0.4694671630859375, -0.446380615234375, -0.4232940673828125, -0.40020751953125, -0.3771209716796875, -0.354034423828125, -0.3309478759765625, -0.307861328125, -0.2847747802734375, -0.261688232421875, -0.2386016845703125, -0.21551513671875, -0.1924285888671875, -0.169342041015625, -0.1462554931640625, -0.1231689453125, -0.1000823974609375, -0.076995849609375, -0.0539093017578125, -0.03082275390625, -0.0077362060546875, 0.015350341796875, 0.0384368896484375, 0.0615234375, 0.0846099853515625, 0.107696533203125, 0.1307830810546875, 0.15386962890625, 0.1769561767578125, 0.200042724609375, 0.2231292724609375, 0.2462158203125, 0.2693023681640625, 0.292388916015625, 0.3154754638671875, 0.33856201171875, 0.3616485595703125, 0.384735107421875, 0.4078216552734375, 0.430908203125, 0.4539947509765625, 0.477081298828125, 0.5001678466796875, 0.52325439453125, 0.5463409423828125, 0.569427490234375, 0.5925140380859375, 0.6156005859375, 0.6386871337890625, 0.661773681640625, 0.6848602294921875, 0.70794677734375, 0.7310333251953125, 0.754119873046875, 0.7772064208984375, 0.80029296875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 20.0, 23.0, 46.0, 94.0, 149.0, 159.0, 200.0, 118.0, 86.0, 40.0, 22.0, 11.0, 15.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.961183071136475, -4.794564247131348, -4.6279449462890625, -4.461325645446777, -4.29470682144165, -4.128087997436523, -3.9614686965942383, -3.7948496341705322, -3.628230571746826, -3.46161150932312, -3.294992446899414, -3.128373384475708, -2.961754322052002, -2.795135259628296, -2.62851619720459, -2.461897134780884, -2.2952780723571777, -2.1286590099334717, -1.9620399475097656, -1.7954208850860596, -1.6288018226623535, -1.4621827602386475, -1.2955636978149414, -1.1289446353912354, -0.9623255729675293, -0.7957065105438232, -0.6290874481201172, -0.46246838569641113, -0.2958493232727051, -0.12923026084899902, 0.03738880157470703, 0.20400786399841309, 0.37062644958496094, 0.537245512008667, 0.703864574432373, 0.8704836368560791, 1.0371026992797852, 1.2037217617034912, 1.3703408241271973, 1.5369598865509033, 1.7035789489746094, 1.8701980113983154, 2.0368170738220215, 2.2034361362457275, 2.3700551986694336, 2.5366742610931396, 2.7032933235168457, 2.8699123859405518, 3.036531448364258, 3.203150510787964, 3.36976957321167, 3.536388635635376, 3.703007698059082, 3.869626760482788, 4.036245822906494, 4.202864646911621, 4.369483947753906, 4.536103248596191, 4.702722072601318, 4.869340896606445, 5.0359601974487305, 5.202579498291016, 5.369198322296143, 5.5358171463012695, 5.702436447143555]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 7.0, 9.0, 11.0, 12.0, 13.0, 10.0, 12.0, 20.0, 15.0, 22.0, 24.0, 28.0, 41.0, 31.0, 40.0, 43.0, 53.0, 49.0, 48.0, 39.0, 46.0, 33.0, 33.0, 50.0, 39.0, 46.0, 31.0, 25.0, 20.0, 23.0, 10.0, 21.0, 16.0, 14.0, 15.0, 7.0, 12.0, 7.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.9066424369812012, -1.8431117534637451, -1.779581069946289, -1.716050386428833, -1.652519702911377, -1.588989019393921, -1.5254584550857544, -1.4619277715682983, -1.3983970880508423, -1.3348664045333862, -1.2713357210159302, -1.2078050374984741, -1.1442744731903076, -1.0807437896728516, -1.0172131061553955, -0.9536824226379395, -0.8901517391204834, -0.8266210556030273, -0.7630903720855713, -0.69955974817276, -0.636029064655304, -0.5724983811378479, -0.5089677572250366, -0.44543707370758057, -0.3819063901901245, -0.31837570667266846, -0.2548450529575348, -0.19131438434123993, -0.12778371572494507, -0.06425303220748901, -0.0007223784923553467, 0.06280827522277832, 0.12633895874023438, 0.18986962735652924, 0.2534002959728241, 0.31693094968795776, 0.3804616332054138, 0.4439923167228699, 0.5075229406356812, 0.5710536241531372, 0.6345843076705933, 0.6981149911880493, 0.7616456747055054, 0.8251762986183167, 0.8887069821357727, 0.9522376656532288, 1.01576828956604, 1.079298973083496, 1.1428296566009521, 1.2063603401184082, 1.2698910236358643, 1.3334217071533203, 1.3969523906707764, 1.4604830741882324, 1.524013638496399, 1.587544322013855, 1.651075005531311, 1.714605689048767, 1.7781363725662231, 1.8416670560836792, 1.9051976203918457, 1.9687283039093018, 2.032258987426758, 2.095789670944214, 2.15932035446167]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 4.0, 5.0, 5.0, 10.0, 8.0, 11.0, 14.0, 34.0, 43.0, 48.0, 95.0, 120.0, 224.0, 354.0, 580.0, 936.0, 1692.0, 2844.0, 5344.0, 10169.0, 20399.0, 43810.0, 103982.0, 256796.0, 328749.0, 153196.0, 61947.0, 27913.0, 13394.0, 7066.0, 3655.0, 2071.0, 1200.0, 666.0, 425.0, 264.0, 162.0, 111.0, 65.0, 39.0, 29.0, 27.0, 17.0, 9.0, 10.0, 8.0, 4.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-0.3291015625, -0.31948089599609375, -0.3098602294921875, -0.30023956298828125, -0.290618896484375, -0.28099822998046875, -0.2713775634765625, -0.26175689697265625, -0.25213623046875, -0.24251556396484375, -0.2328948974609375, -0.22327423095703125, -0.213653564453125, -0.20403289794921875, -0.1944122314453125, -0.18479156494140625, -0.1751708984375, -0.16555023193359375, -0.1559295654296875, -0.14630889892578125, -0.136688232421875, -0.12706756591796875, -0.1174468994140625, -0.10782623291015625, -0.09820556640625, -0.08858489990234375, -0.0789642333984375, -0.06934356689453125, -0.059722900390625, -0.05010223388671875, -0.0404815673828125, -0.03086090087890625, -0.021240234375, -0.01161956787109375, -0.0019989013671875, 0.00762176513671875, 0.017242431640625, 0.02686309814453125, 0.0364837646484375, 0.04610443115234375, 0.05572509765625, 0.06534576416015625, 0.0749664306640625, 0.08458709716796875, 0.094207763671875, 0.10382843017578125, 0.1134490966796875, 0.12306976318359375, 0.1326904296875, 0.14231109619140625, 0.1519317626953125, 0.16155242919921875, 0.171173095703125, 0.18079376220703125, 0.1904144287109375, 0.20003509521484375, 0.20965576171875, 0.21927642822265625, 0.2288970947265625, 0.23851776123046875, 0.248138427734375, 0.25775909423828125, 0.2673797607421875, 0.27700042724609375, 0.28662109375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 1.0, 6.0, 2.0, 1.0, 5.0, 6.0, 7.0, 7.0, 23.0, 8.0, 18.0, 19.0, 22.0, 21.0, 28.0, 24.0, 32.0, 39.0, 32.0, 34.0, 59.0, 57.0, 45.0, 46.0, 56.0, 42.0, 57.0, 37.0, 31.0, 37.0, 39.0, 36.0, 27.0, 19.0, 20.0, 15.0, 11.0, 10.0, 7.0, 3.0, 4.0, 6.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.183837890625, -0.17787551879882812, -0.17191314697265625, -0.16595077514648438, -0.1599884033203125, -0.15402603149414062, -0.14806365966796875, -0.14210128784179688, -0.136138916015625, -0.13017654418945312, -0.12421417236328125, -0.11825180053710938, -0.1122894287109375, -0.10632705688476562, -0.10036468505859375, -0.09440231323242188, -0.08843994140625, -0.08247756958007812, -0.07651519775390625, -0.07055282592773438, -0.0645904541015625, -0.058628082275390625, -0.05266571044921875, -0.046703338623046875, -0.040740966796875, -0.034778594970703125, -0.02881622314453125, -0.022853851318359375, -0.0168914794921875, -0.010929107666015625, -0.00496673583984375, 0.000995635986328125, 0.0069580078125, 0.012920379638671875, 0.01888275146484375, 0.024845123291015625, 0.0308074951171875, 0.036769866943359375, 0.04273223876953125, 0.048694610595703125, 0.054656982421875, 0.060619354248046875, 0.06658172607421875, 0.07254409790039062, 0.0785064697265625, 0.08446884155273438, 0.09043121337890625, 0.09639358520507812, 0.10235595703125, 0.10831832885742188, 0.11428070068359375, 0.12024307250976562, 0.1262054443359375, 0.13216781616210938, 0.13813018798828125, 0.14409255981445312, 0.150054931640625, 0.15601730346679688, 0.16197967529296875, 0.16794204711914062, 0.1739044189453125, 0.17986679077148438, 0.18582916259765625, 0.19179153442382812, 0.19775390625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 12.0, 9.0, 13.0, 29.0, 31.0, 44.0, 71.0, 100.0, 128.0, 173.0, 250.0, 436.0, 692.0, 1322.0, 2954.0, 9999.0, 59192.0, 733098.0, 205170.0, 24836.0, 5451.0, 1953.0, 937.0, 530.0, 344.0, 247.0, 136.0, 109.0, 89.0, 52.0, 46.0, 27.0, 17.0, 15.0, 17.0, 5.0, 5.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69091796875, -0.6691741943359375, -0.647430419921875, -0.6256866455078125, -0.60394287109375, -0.5821990966796875, -0.560455322265625, -0.5387115478515625, -0.5169677734375, -0.4952239990234375, -0.473480224609375, -0.4517364501953125, -0.42999267578125, -0.4082489013671875, -0.386505126953125, -0.3647613525390625, -0.343017578125, -0.3212738037109375, -0.299530029296875, -0.2777862548828125, -0.25604248046875, -0.2342987060546875, -0.212554931640625, -0.1908111572265625, -0.1690673828125, -0.1473236083984375, -0.125579833984375, -0.1038360595703125, -0.08209228515625, -0.0603485107421875, -0.038604736328125, -0.0168609619140625, 0.0048828125, 0.0266265869140625, 0.048370361328125, 0.0701141357421875, 0.09185791015625, 0.1136016845703125, 0.135345458984375, 0.1570892333984375, 0.1788330078125, 0.2005767822265625, 0.222320556640625, 0.2440643310546875, 0.26580810546875, 0.2875518798828125, 0.309295654296875, 0.3310394287109375, 0.352783203125, 0.3745269775390625, 0.396270751953125, 0.4180145263671875, 0.43975830078125, 0.4615020751953125, 0.483245849609375, 0.5049896240234375, 0.5267333984375, 0.5484771728515625, 0.570220947265625, 0.5919647216796875, 0.61370849609375, 0.6354522705078125, 0.657196044921875, 0.6789398193359375, 0.70068359375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 10.0, 3.0, 5.0, 5.0, 7.0, 12.0, 10.0, 16.0, 20.0, 29.0, 33.0, 45.0, 45.0, 38.0, 59.0, 52.0, 60.0, 57.0, 68.0, 58.0, 60.0, 57.0, 44.0, 48.0, 22.0, 21.0, 22.0, 19.0, 19.0, 12.0, 8.0, 12.0, 6.0, 5.0, 5.0, 5.0, 3.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64794921875, -0.6209030151367188, -0.5938568115234375, -0.5668106079101562, -0.539764404296875, -0.5127182006835938, -0.4856719970703125, -0.45862579345703125, -0.43157958984375, -0.40453338623046875, -0.3774871826171875, -0.35044097900390625, -0.323394775390625, -0.29634857177734375, -0.2693023681640625, -0.24225616455078125, -0.2152099609375, -0.18816375732421875, -0.1611175537109375, -0.13407135009765625, -0.107025146484375, -0.07997894287109375, -0.0529327392578125, -0.02588653564453125, 0.00115966796875, 0.02820587158203125, 0.0552520751953125, 0.08229827880859375, 0.109344482421875, 0.13639068603515625, 0.1634368896484375, 0.19048309326171875, 0.217529296875, 0.24457550048828125, 0.2716217041015625, 0.29866790771484375, 0.325714111328125, 0.35276031494140625, 0.3798065185546875, 0.40685272216796875, 0.43389892578125, 0.46094512939453125, 0.4879913330078125, 0.5150375366210938, 0.542083740234375, 0.5691299438476562, 0.5961761474609375, 0.6232223510742188, 0.6502685546875, 0.6773147583007812, 0.7043609619140625, 0.7314071655273438, 0.758453369140625, 0.7854995727539062, 0.8125457763671875, 0.8395919799804688, 0.86663818359375, 0.8936843872070312, 0.9207305908203125, 0.9477767944335938, 0.974822998046875, 1.0018692016601562, 1.0289154052734375, 1.0559616088867188, 1.0830078125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 4.0, 5.0, 8.0, 6.0, 5.0, 23.0, 16.0, 19.0, 24.0, 24.0, 55.0, 70.0, 112.0, 164.0, 315.0, 496.0, 913.0, 2184.0, 5485.0, 16739.0, 67301.0, 587454.0, 284937.0, 58115.0, 15131.0, 4815.0, 1940.0, 934.0, 444.0, 269.0, 189.0, 93.0, 79.0, 44.0, 33.0, 26.0, 17.0, 12.0, 12.0, 9.0, 8.0, 5.0, 8.0, 4.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1268310546875, -0.12244987487792969, -0.11806869506835938, -0.11368751525878906, -0.10930633544921875, -0.10492515563964844, -0.10054397583007812, -0.09616279602050781, -0.0917816162109375, -0.08740043640136719, -0.08301925659179688, -0.07863807678222656, -0.07425689697265625, -0.06987571716308594, -0.06549453735351562, -0.06111335754394531, -0.056732177734375, -0.05235099792480469, -0.047969818115234375, -0.04358863830566406, -0.03920745849609375, -0.03482627868652344, -0.030445098876953125, -0.026063919067382812, -0.0216827392578125, -0.017301559448242188, -0.012920379638671875, -0.008539199829101562, -0.00415802001953125, 0.0002231597900390625, 0.004604339599609375, 0.008985519409179688, 0.01336669921875, 0.017747879028320312, 0.022129058837890625, 0.026510238647460938, 0.03089141845703125, 0.03527259826660156, 0.039653778076171875, 0.04403495788574219, 0.0484161376953125, 0.05279731750488281, 0.057178497314453125, 0.06155967712402344, 0.06594085693359375, 0.07032203674316406, 0.07470321655273438, 0.07908439636230469, 0.083465576171875, 0.08784675598144531, 0.09222793579101562, 0.09660911560058594, 0.10099029541015625, 0.10537147521972656, 0.10975265502929688, 0.11413383483886719, 0.1185150146484375, 0.12289619445800781, 0.12727737426757812, 0.13165855407714844, 0.13603973388671875, 0.14042091369628906, 0.14480209350585938, 0.1491832733154297, 0.153564453125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 3.0, 4.0, 11.0, 12.0, 12.0, 31.0, 36.0, 31.0, 66.0, 102.0, 162.0, 145.0, 104.0, 71.0, 67.0, 45.0, 25.0, 21.0, 12.0, 6.0, 8.0, 8.0, 5.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.282329559326172e-05, -5.9859827160835266e-05, -5.6896358728408813e-05, -5.393289029598236e-05, -5.096942186355591e-05, -4.8005953431129456e-05, -4.5042484998703e-05, -4.207901656627655e-05, -3.91155481338501e-05, -3.6152079701423645e-05, -3.318861126899719e-05, -3.022514283657074e-05, -2.7261674404144287e-05, -2.4298205971717834e-05, -2.1334737539291382e-05, -1.837126910686493e-05, -1.5407800674438477e-05, -1.2444332242012024e-05, -9.480863809585571e-06, -6.517395377159119e-06, -3.553926944732666e-06, -5.904585123062134e-07, 2.3730099201202393e-06, 5.336478352546692e-06, 8.299946784973145e-06, 1.1263415217399597e-05, 1.422688364982605e-05, 1.7190352082252502e-05, 2.0153820514678955e-05, 2.3117288947105408e-05, 2.608075737953186e-05, 2.9044225811958313e-05, 3.2007694244384766e-05, 3.497116267681122e-05, 3.793463110923767e-05, 4.0898099541664124e-05, 4.3861567974090576e-05, 4.682503640651703e-05, 4.978850483894348e-05, 5.2751973271369934e-05, 5.571544170379639e-05, 5.867891013622284e-05, 6.164237856864929e-05, 6.460584700107574e-05, 6.75693154335022e-05, 7.053278386592865e-05, 7.34962522983551e-05, 7.645972073078156e-05, 7.942318916320801e-05, 8.238665759563446e-05, 8.535012602806091e-05, 8.831359446048737e-05, 9.127706289291382e-05, 9.424053132534027e-05, 9.720399975776672e-05, 0.00010016746819019318, 0.00010313093662261963, 0.00010609440505504608, 0.00010905787348747253, 0.00011202134191989899, 0.00011498481035232544, 0.00011794827878475189, 0.00012091174721717834, 0.0001238752156496048, 0.00012683868408203125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 11.0, 11.0, 18.0, 30.0, 44.0, 71.0, 110.0, 175.0, 302.0, 599.0, 1359.0, 4037.0, 15778.0, 94715.0, 741601.0, 156602.0, 24033.0, 5563.0, 1775.0, 803.0, 372.0, 221.0, 125.0, 76.0, 51.0, 26.0, 18.0, 17.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.183837890625, -0.17820358276367188, -0.17256927490234375, -0.16693496704101562, -0.1613006591796875, -0.15566635131835938, -0.15003204345703125, -0.14439773559570312, -0.138763427734375, -0.13312911987304688, -0.12749481201171875, -0.12186050415039062, -0.1162261962890625, -0.11059188842773438, -0.10495758056640625, -0.09932327270507812, -0.09368896484375, -0.08805465698242188, -0.08242034912109375, -0.07678604125976562, -0.0711517333984375, -0.06551742553710938, -0.05988311767578125, -0.054248809814453125, -0.048614501953125, -0.042980194091796875, -0.03734588623046875, -0.031711578369140625, -0.0260772705078125, -0.020442962646484375, -0.01480865478515625, -0.009174346923828125, -0.0035400390625, 0.002094268798828125, 0.00772857666015625, 0.013362884521484375, 0.0189971923828125, 0.024631500244140625, 0.03026580810546875, 0.035900115966796875, 0.041534423828125, 0.047168731689453125, 0.05280303955078125, 0.058437347412109375, 0.0640716552734375, 0.06970596313476562, 0.07534027099609375, 0.08097457885742188, 0.08660888671875, 0.09224319458007812, 0.09787750244140625, 0.10351181030273438, 0.1091461181640625, 0.11478042602539062, 0.12041473388671875, 0.12604904174804688, 0.131683349609375, 0.13731765747070312, 0.14295196533203125, 0.14858627319335938, 0.1542205810546875, 0.15985488891601562, 0.16548919677734375, 0.17112350463867188, 0.1767578125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 16.0, 8.0, 9.0, 16.0, 9.0, 18.0, 12.0, 19.0, 34.0, 20.0, 34.0, 37.0, 45.0, 40.0, 54.0, 60.0, 61.0, 64.0, 55.0, 39.0, 43.0, 44.0, 28.0, 36.0, 39.0, 23.0, 22.0, 14.0, 17.0, 11.0, 15.0, 10.0, 13.0, 8.0, 8.0, 5.0, 3.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.104736328125, -0.1016683578491211, -0.09860038757324219, -0.09553241729736328, -0.09246444702148438, -0.08939647674560547, -0.08632850646972656, -0.08326053619384766, -0.08019256591796875, -0.07712459564208984, -0.07405662536621094, -0.07098865509033203, -0.06792068481445312, -0.06485271453857422, -0.06178474426269531, -0.058716773986816406, -0.0556488037109375, -0.052580833435058594, -0.04951286315917969, -0.04644489288330078, -0.043376922607421875, -0.04030895233154297, -0.03724098205566406, -0.034173011779785156, -0.03110504150390625, -0.028037071228027344, -0.024969100952148438, -0.02190113067626953, -0.018833160400390625, -0.01576519012451172, -0.012697219848632812, -0.009629249572753906, -0.006561279296875, -0.0034933090209960938, -0.0004253387451171875, 0.0026426315307617188, 0.005710601806640625, 0.008778572082519531, 0.011846542358398438, 0.014914512634277344, 0.01798248291015625, 0.021050453186035156, 0.024118423461914062, 0.02718639373779297, 0.030254364013671875, 0.03332233428955078, 0.03639030456542969, 0.039458274841308594, 0.0425262451171875, 0.045594215393066406, 0.04866218566894531, 0.05173015594482422, 0.054798126220703125, 0.05786609649658203, 0.06093406677246094, 0.06400203704833984, 0.06707000732421875, 0.07013797760009766, 0.07320594787597656, 0.07627391815185547, 0.07934188842773438, 0.08240985870361328, 0.08547782897949219, 0.0885457992553711, 0.09161376953125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 13.0, 29.0, 78.0, 188.0, 450.0, 166.0, 52.0, 15.0, 9.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.462690353393555, -4.207821369171143, -3.9529519081115723, -3.69808292388916, -3.443213701248169, -3.1883444786071777, -2.9334754943847656, -2.6786062717437744, -2.423737049102783, -2.168867826461792, -1.9139987230300903, -1.6591296195983887, -1.4042603969573975, -1.1493911743164062, -0.8945220708847046, -0.6396529674530029, -0.3847837448120117, -0.12991458177566528, 0.12495458126068115, 0.3798237442970276, 0.634692907333374, 0.8895621299743652, 1.144431233406067, 1.3993003368377686, 1.6541695594787598, 1.909038782119751, 2.163908004760742, 2.4187769889831543, 2.6736462116241455, 2.9285154342651367, 3.183384418487549, 3.43825364112854, 3.6931228637695312, 3.9479920864105225, 4.202861309051514, 4.457730293273926, 4.712599754333496, 4.967468738555908, 5.22233772277832, 5.477207183837891, 5.732076168060303, 5.986945152282715, 6.241814613342285, 6.496683597564697, 6.751552581787109, 7.00642204284668, 7.261291027069092, 7.516160011291504, 7.771029472351074, 8.025898933410645, 8.280767440795898, 8.535636901855469, 8.790506362915039, 9.04537582397461, 9.300244331359863, 9.555113792419434, 9.809982299804688, 10.064851760864258, 10.319720268249512, 10.574589729309082, 10.829459190368652, 11.084327697753906, 11.339197158813477, 11.594066619873047, 11.848936080932617]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 10.0, 6.0, 4.0, 7.0, 11.0, 6.0, 14.0, 13.0, 18.0, 18.0, 22.0, 22.0, 26.0, 36.0, 39.0, 70.0, 103.0, 164.0, 89.0, 45.0, 37.0, 45.0, 34.0, 25.0, 27.0, 16.0, 17.0, 16.0, 13.0, 12.0, 4.0, 7.0, 5.0, 2.0, 6.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.317176342010498, -3.214874505996704, -3.112572431564331, -3.010270595550537, -2.907968521118164, -2.80566668510437, -2.703364849090576, -2.601062774658203, -2.49876070022583, -2.396458864212036, -2.294156789779663, -2.191854953765869, -2.089552879333496, -1.9872510433197021, -1.8849490880966187, -1.7826471328735352, -1.6803452968597412, -1.5780433416366577, -1.4757413864135742, -1.3734395503997803, -1.2711374759674072, -1.1688356399536133, -1.0665336847305298, -0.9642317295074463, -0.8619297742843628, -0.7596278190612793, -0.6573258638381958, -0.5550239682197571, -0.4527220129966736, -0.3504200577735901, -0.24811816215515137, -0.14581620693206787, -0.043514251708984375, 0.05878768861293793, 0.16108962893486023, 0.26339155435562134, 0.36569350957870483, 0.46799546480178833, 0.570297360420227, 0.6725993156433105, 0.774901270866394, 0.8772032260894775, 0.979505181312561, 1.0818071365356445, 1.1841089725494385, 1.2864110469818115, 1.3887128829956055, 1.491014838218689, 1.5933167934417725, 1.695618748664856, 1.7979207038879395, 1.9002225399017334, 2.0025246143341064, 2.1048264503479004, 2.2071285247802734, 2.3094303607940674, 2.4117321968078613, 2.5140340328216553, 2.6163361072540283, 2.7186379432678223, 2.8209400177001953, 2.9232418537139893, 3.025543689727783, 3.1278457641601562, 3.2301478385925293]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 7.0, 8.0, 8.0, 20.0, 14.0, 24.0, 36.0, 52.0, 107.0, 138.0, 245.0, 466.0, 986.0, 2365.0, 7424.0, 35785.0, 507727.0, 3184821.0, 410478.0, 32524.0, 6858.0, 2224.0, 899.0, 450.0, 250.0, 135.0, 79.0, 53.0, 32.0, 23.0, 14.0, 10.0, 6.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.61962890625, -0.6011123657226562, -0.5825958251953125, -0.5640792846679688, -0.545562744140625, -0.5270462036132812, -0.5085296630859375, -0.49001312255859375, -0.47149658203125, -0.45298004150390625, -0.4344635009765625, -0.41594696044921875, -0.397430419921875, -0.37891387939453125, -0.3603973388671875, -0.34188079833984375, -0.3233642578125, -0.30484771728515625, -0.2863311767578125, -0.26781463623046875, -0.249298095703125, -0.23078155517578125, -0.2122650146484375, -0.19374847412109375, -0.17523193359375, -0.15671539306640625, -0.1381988525390625, -0.11968231201171875, -0.101165771484375, -0.08264923095703125, -0.0641326904296875, -0.04561614990234375, -0.027099609375, -0.00858306884765625, 0.0099334716796875, 0.02845001220703125, 0.046966552734375, 0.06548309326171875, 0.0839996337890625, 0.10251617431640625, 0.12103271484375, 0.13954925537109375, 0.1580657958984375, 0.17658233642578125, 0.195098876953125, 0.21361541748046875, 0.2321319580078125, 0.25064849853515625, 0.2691650390625, 0.28768157958984375, 0.3061981201171875, 0.32471466064453125, 0.343231201171875, 0.36174774169921875, 0.3802642822265625, 0.39878082275390625, 0.41729736328125, 0.43581390380859375, 0.4543304443359375, 0.47284698486328125, 0.491363525390625, 0.5098800659179688, 0.5283966064453125, 0.5469131469726562, 0.5654296875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 5.0, 4.0, 4.0, 7.0, 7.0, 14.0, 17.0, 12.0, 12.0, 21.0, 25.0, 31.0, 27.0, 34.0, 35.0, 30.0, 42.0, 37.0, 55.0, 46.0, 46.0, 48.0, 40.0, 37.0, 48.0, 36.0, 41.0, 31.0, 41.0, 34.0, 23.0, 23.0, 13.0, 21.0, 12.0, 8.0, 10.0, 9.0, 8.0, 4.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1585693359375, -0.1536998748779297, -0.14883041381835938, -0.14396095275878906, -0.13909149169921875, -0.13422203063964844, -0.12935256958007812, -0.12448310852050781, -0.1196136474609375, -0.11474418640136719, -0.10987472534179688, -0.10500526428222656, -0.10013580322265625, -0.09526634216308594, -0.09039688110351562, -0.08552742004394531, -0.080657958984375, -0.07578849792480469, -0.07091903686523438, -0.06604957580566406, -0.06118011474609375, -0.05631065368652344, -0.051441192626953125, -0.04657173156738281, -0.0417022705078125, -0.03683280944824219, -0.031963348388671875, -0.027093887329101562, -0.02222442626953125, -0.017354965209960938, -0.012485504150390625, -0.0076160430908203125, -0.00274658203125, 0.0021228790283203125, 0.006992340087890625, 0.011861801147460938, 0.01673126220703125, 0.021600723266601562, 0.026470184326171875, 0.03133964538574219, 0.0362091064453125, 0.04107856750488281, 0.045948028564453125, 0.05081748962402344, 0.05568695068359375, 0.06055641174316406, 0.06542587280273438, 0.07029533386230469, 0.075164794921875, 0.08003425598144531, 0.08490371704101562, 0.08977317810058594, 0.09464263916015625, 0.09951210021972656, 0.10438156127929688, 0.10925102233886719, 0.1141204833984375, 0.11898994445800781, 0.12385940551757812, 0.12872886657714844, 0.13359832763671875, 0.13846778869628906, 0.14333724975585938, 0.1482067108154297, 0.153076171875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 0.0, 6.0, 11.0, 11.0, 19.0, 18.0, 35.0, 58.0, 95.0, 151.0, 276.0, 624.0, 1587.0, 6695.0, 516148.0, 3652879.0, 12005.0, 2124.0, 752.0, 362.0, 185.0, 86.0, 38.0, 34.0, 26.0, 22.0, 12.0, 4.0, 6.0, 3.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.076171875, -2.017059326171875, -1.95794677734375, -1.898834228515625, -1.8397216796875, -1.780609130859375, -1.72149658203125, -1.662384033203125, -1.603271484375, -1.544158935546875, -1.48504638671875, -1.425933837890625, -1.3668212890625, -1.307708740234375, -1.24859619140625, -1.189483642578125, -1.13037109375, -1.071258544921875, -1.01214599609375, -0.953033447265625, -0.8939208984375, -0.834808349609375, -0.77569580078125, -0.716583251953125, -0.657470703125, -0.598358154296875, -0.53924560546875, -0.480133056640625, -0.4210205078125, -0.361907958984375, -0.30279541015625, -0.243682861328125, -0.1845703125, -0.125457763671875, -0.06634521484375, -0.007232666015625, 0.0518798828125, 0.110992431640625, 0.17010498046875, 0.229217529296875, 0.288330078125, 0.347442626953125, 0.40655517578125, 0.465667724609375, 0.5247802734375, 0.583892822265625, 0.64300537109375, 0.702117919921875, 0.76123046875, 0.820343017578125, 0.87945556640625, 0.938568115234375, 0.9976806640625, 1.056793212890625, 1.11590576171875, 1.175018310546875, 1.234130859375, 1.293243408203125, 1.35235595703125, 1.411468505859375, 1.4705810546875, 1.529693603515625, 1.58880615234375, 1.647918701171875, 1.70703125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 12.0, 17.0, 28.0, 43.0, 55.0, 98.0, 152.0, 254.0, 477.0, 742.0, 784.0, 532.0, 338.0, 202.0, 104.0, 101.0, 48.0, 31.0, 17.0, 13.0, 10.0, 4.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0654296875, -1.0366592407226562, -1.0078887939453125, -0.9791183471679688, -0.950347900390625, -0.9215774536132812, -0.8928070068359375, -0.8640365600585938, -0.83526611328125, -0.8064956665039062, -0.7777252197265625, -0.7489547729492188, -0.720184326171875, -0.6914138793945312, -0.6626434326171875, -0.6338729858398438, -0.6051025390625, -0.5763320922851562, -0.5475616455078125, -0.5187911987304688, -0.490020751953125, -0.46125030517578125, -0.4324798583984375, -0.40370941162109375, -0.37493896484375, -0.34616851806640625, -0.3173980712890625, -0.28862762451171875, -0.259857177734375, -0.23108673095703125, -0.2023162841796875, -0.17354583740234375, -0.144775390625, -0.11600494384765625, -0.0872344970703125, -0.05846405029296875, -0.029693603515625, -0.00092315673828125, 0.0278472900390625, 0.05661773681640625, 0.08538818359375, 0.11415863037109375, 0.1429290771484375, 0.17169952392578125, 0.200469970703125, 0.22924041748046875, 0.2580108642578125, 0.28678131103515625, 0.3155517578125, 0.34432220458984375, 0.3730926513671875, 0.40186309814453125, 0.430633544921875, 0.45940399169921875, 0.4881744384765625, 0.5169448852539062, 0.54571533203125, 0.5744857788085938, 0.6032562255859375, 0.6320266723632812, 0.660797119140625, 0.6895675659179688, 0.7183380126953125, 0.7471084594726562, 0.77587890625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 3.0, 4.0, 7.0, 15.0, 25.0, 49.0, 110.0, 200.0, 219.0, 163.0, 93.0, 42.0, 25.0, 15.0, 8.0, 6.0, 6.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.740059852600098, -9.437098503112793, -9.134137153625488, -8.831175804138184, -8.528214454650879, -8.225253105163574, -7.922291278839111, -7.619329929351807, -7.316368579864502, -7.013407230377197, -6.710445880889893, -6.407484531402588, -6.104522705078125, -5.80156135559082, -5.498600006103516, -5.195638656616211, -4.892677307128906, -4.589715957641602, -4.286754608154297, -3.983793020248413, -3.6808316707611084, -3.3778703212738037, -3.07490873336792, -2.7719473838806152, -2.4689860343933105, -2.166024684906006, -1.8630632162094116, -1.5601017475128174, -1.2571403980255127, -0.954179048538208, -0.6512175798416138, -0.34825611114501953, -0.04529571533203125, 0.2576656937599182, 0.5606271028518677, 0.8635885119438171, 1.1665499210357666, 1.4695112705230713, 1.7724727392196655, 2.0754342079162598, 2.3783955574035645, 2.681356906890869, 2.984318256378174, 3.2872798442840576, 3.5902411937713623, 3.893202543258667, 4.196164131164551, 4.4991254806518555, 4.80208683013916, 5.105048179626465, 5.4080095291137695, 5.710970878601074, 6.013932228088379, 6.316893577575684, 6.6198554039001465, 6.922816753387451, 7.225778102874756, 7.5287394523620605, 7.831700801849365, 8.134662628173828, 8.437623977661133, 8.740585327148438, 9.043546676635742, 9.346508026123047, 9.649469375610352]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 8.0, 2.0, 3.0, 3.0, 4.0, 7.0, 9.0, 10.0, 16.0, 8.0, 18.0, 16.0, 22.0, 32.0, 34.0, 35.0, 40.0, 36.0, 36.0, 46.0, 49.0, 60.0, 71.0, 57.0, 58.0, 43.0, 36.0, 45.0, 38.0, 28.0, 28.0, 21.0, 16.0, 13.0, 12.0, 16.0, 5.0, 13.0, 7.0, 5.0, 2.0, 5.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-4.816014289855957, -4.6947784423828125, -4.573542594909668, -4.452306747436523, -4.331070899963379, -4.209835529327393, -4.088599681854248, -3.9673638343811035, -3.846127986907959, -3.7248921394348145, -3.60365629196167, -3.4824206829071045, -3.36118483543396, -3.2399489879608154, -3.11871337890625, -2.9974775314331055, -2.876241683959961, -2.7550058364868164, -2.633769989013672, -2.5125343799591064, -2.391298532485962, -2.2700626850128174, -2.148827075958252, -2.0275912284851074, -1.906355381011963, -1.7851195335388184, -1.6638838052749634, -1.5426480770111084, -1.4214122295379639, -1.3001763820648193, -1.1789406538009644, -1.0577049255371094, -0.9364688396453857, -0.815233051776886, -0.6939972639083862, -0.5727614760398865, -0.4515256881713867, -0.33028990030288696, -0.2090541124343872, -0.08781832456588745, 0.033417463302612305, 0.15465325117111206, 0.2758890390396118, 0.3971248269081116, 0.5183606147766113, 0.6395964026451111, 0.7608321905136108, 0.8820679783821106, 1.0033037662506104, 1.1245396137237549, 1.2457753419876099, 1.3670110702514648, 1.4882469177246094, 1.609482765197754, 1.7307184934616089, 1.8519542217254639, 1.9731900691986084, 2.094425916671753, 2.2156615257263184, 2.336897373199463, 2.4581332206726074, 2.579369068145752, 2.7006049156188965, 2.821840524673462, 2.9430763721466064]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 5.0, 8.0, 12.0, 32.0, 23.0, 68.0, 129.0, 247.0, 476.0, 1001.0, 2306.0, 5941.0, 18711.0, 78560.0, 570575.0, 299694.0, 49787.0, 13080.0, 4487.0, 1794.0, 771.0, 409.0, 203.0, 94.0, 49.0, 47.0, 16.0, 10.0, 7.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56396484375, -0.545074462890625, -0.52618408203125, -0.507293701171875, -0.4884033203125, -0.469512939453125, -0.45062255859375, -0.431732177734375, -0.412841796875, -0.393951416015625, -0.37506103515625, -0.356170654296875, -0.3372802734375, -0.318389892578125, -0.29949951171875, -0.280609130859375, -0.26171875, -0.242828369140625, -0.22393798828125, -0.205047607421875, -0.1861572265625, -0.167266845703125, -0.14837646484375, -0.129486083984375, -0.110595703125, -0.091705322265625, -0.07281494140625, -0.053924560546875, -0.0350341796875, -0.016143798828125, 0.00274658203125, 0.021636962890625, 0.04052734375, 0.059417724609375, 0.07830810546875, 0.097198486328125, 0.1160888671875, 0.134979248046875, 0.15386962890625, 0.172760009765625, 0.191650390625, 0.210540771484375, 0.22943115234375, 0.248321533203125, 0.2672119140625, 0.286102294921875, 0.30499267578125, 0.323883056640625, 0.3427734375, 0.361663818359375, 0.38055419921875, 0.399444580078125, 0.4183349609375, 0.437225341796875, 0.45611572265625, 0.475006103515625, 0.493896484375, 0.512786865234375, 0.53167724609375, 0.550567626953125, 0.5694580078125, 0.588348388671875, 0.60723876953125, 0.626129150390625, 0.64501953125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 4.0, 7.0, 15.0, 15.0, 16.0, 17.0, 27.0, 28.0, 33.0, 46.0, 47.0, 58.0, 73.0, 70.0, 74.0, 67.0, 50.0, 61.0, 63.0, 48.0, 39.0, 28.0, 25.0, 22.0, 20.0, 8.0, 8.0, 6.0, 6.0, 7.0, 1.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.380859375, -0.3704032897949219, -0.35994720458984375, -0.3494911193847656, -0.3390350341796875, -0.3285789489746094, -0.31812286376953125, -0.3076667785644531, -0.297210693359375, -0.2867546081542969, -0.27629852294921875, -0.2658424377441406, -0.2553863525390625, -0.24493026733398438, -0.23447418212890625, -0.22401809692382812, -0.21356201171875, -0.20310592651367188, -0.19264984130859375, -0.18219375610351562, -0.1717376708984375, -0.16128158569335938, -0.15082550048828125, -0.14036941528320312, -0.129913330078125, -0.11945724487304688, -0.10900115966796875, -0.09854507446289062, -0.0880889892578125, -0.07763290405273438, -0.06717681884765625, -0.056720733642578125, -0.0462646484375, -0.035808563232421875, -0.02535247802734375, -0.014896392822265625, -0.0044403076171875, 0.006015777587890625, 0.01647186279296875, 0.026927947998046875, 0.037384033203125, 0.047840118408203125, 0.05829620361328125, 0.06875228881835938, 0.0792083740234375, 0.08966445922851562, 0.10012054443359375, 0.11057662963867188, 0.12103271484375, 0.13148880004882812, 0.14194488525390625, 0.15240097045898438, 0.1628570556640625, 0.17331314086914062, 0.18376922607421875, 0.19422531127929688, 0.204681396484375, 0.21513748168945312, 0.22559356689453125, 0.23604965209960938, 0.2465057373046875, 0.2569618225097656, 0.26741790771484375, 0.2778739929199219, 0.288330078125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 5.0, 5.0, 14.0, 13.0, 10.0, 21.0, 37.0, 43.0, 67.0, 106.0, 150.0, 252.0, 463.0, 850.0, 2309.0, 7619.0, 43476.0, 859710.0, 112208.0, 14712.0, 3616.0, 1293.0, 611.0, 329.0, 220.0, 126.0, 87.0, 66.0, 35.0, 28.0, 14.0, 13.0, 15.0, 3.0, 6.0, 8.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.72314453125, -0.7023086547851562, -0.6814727783203125, -0.6606369018554688, -0.639801025390625, -0.6189651489257812, -0.5981292724609375, -0.5772933959960938, -0.55645751953125, -0.5356216430664062, -0.5147857666015625, -0.49394989013671875, -0.473114013671875, -0.45227813720703125, -0.4314422607421875, -0.41060638427734375, -0.3897705078125, -0.36893463134765625, -0.3480987548828125, -0.32726287841796875, -0.306427001953125, -0.28559112548828125, -0.2647552490234375, -0.24391937255859375, -0.22308349609375, -0.20224761962890625, -0.1814117431640625, -0.16057586669921875, -0.139739990234375, -0.11890411376953125, -0.0980682373046875, -0.07723236083984375, -0.056396484375, -0.03556060791015625, -0.0147247314453125, 0.00611114501953125, 0.026947021484375, 0.04778289794921875, 0.0686187744140625, 0.08945465087890625, 0.11029052734375, 0.13112640380859375, 0.1519622802734375, 0.17279815673828125, 0.193634033203125, 0.21446990966796875, 0.2353057861328125, 0.25614166259765625, 0.2769775390625, 0.29781341552734375, 0.3186492919921875, 0.33948516845703125, 0.360321044921875, 0.38115692138671875, 0.4019927978515625, 0.42282867431640625, 0.44366455078125, 0.46450042724609375, 0.4853363037109375, 0.5061721801757812, 0.527008056640625, 0.5478439331054688, 0.5686798095703125, 0.5895156860351562, 0.6103515625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 3.0, 5.0, 7.0, 8.0, 4.0, 19.0, 26.0, 19.0, 25.0, 20.0, 26.0, 42.0, 30.0, 39.0, 57.0, 80.0, 95.0, 78.0, 82.0, 44.0, 46.0, 47.0, 33.0, 25.0, 22.0, 22.0, 21.0, 15.0, 9.0, 11.0, 6.0, 9.0, 4.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.0966796875, -1.06072998046875, -1.0247802734375, -0.98883056640625, -0.952880859375, -0.91693115234375, -0.8809814453125, -0.84503173828125, -0.80908203125, -0.77313232421875, -0.7371826171875, -0.70123291015625, -0.665283203125, -0.62933349609375, -0.5933837890625, -0.55743408203125, -0.521484375, -0.48553466796875, -0.4495849609375, -0.41363525390625, -0.377685546875, -0.34173583984375, -0.3057861328125, -0.26983642578125, -0.23388671875, -0.19793701171875, -0.1619873046875, -0.12603759765625, -0.090087890625, -0.05413818359375, -0.0181884765625, 0.01776123046875, 0.0537109375, 0.08966064453125, 0.1256103515625, 0.16156005859375, 0.197509765625, 0.23345947265625, 0.2694091796875, 0.30535888671875, 0.34130859375, 0.37725830078125, 0.4132080078125, 0.44915771484375, 0.485107421875, 0.52105712890625, 0.5570068359375, 0.59295654296875, 0.62890625, 0.66485595703125, 0.7008056640625, 0.73675537109375, 0.772705078125, 0.80865478515625, 0.8446044921875, 0.88055419921875, 0.91650390625, 0.95245361328125, 0.9884033203125, 1.02435302734375, 1.060302734375, 1.09625244140625, 1.1322021484375, 1.16815185546875, 1.2041015625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 1.0, 3.0, 12.0, 8.0, 10.0, 14.0, 22.0, 29.0, 34.0, 52.0, 64.0, 101.0, 174.0, 276.0, 441.0, 745.0, 1422.0, 3285.0, 8104.0, 23822.0, 110196.0, 810129.0, 61603.0, 16545.0, 6003.0, 2554.0, 1217.0, 603.0, 358.0, 231.0, 157.0, 83.0, 72.0, 45.0, 32.0, 20.0, 19.0, 9.0, 11.0, 9.0, 9.0, 11.0, 9.0, 2.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.10870361328125, -0.10562801361083984, -0.10255241394042969, -0.09947681427001953, -0.09640121459960938, -0.09332561492919922, -0.09025001525878906, -0.0871744155883789, -0.08409881591796875, -0.0810232162475586, -0.07794761657714844, -0.07487201690673828, -0.07179641723632812, -0.06872081756591797, -0.06564521789550781, -0.06256961822509766, -0.0594940185546875, -0.056418418884277344, -0.05334281921386719, -0.05026721954345703, -0.047191619873046875, -0.04411602020263672, -0.04104042053222656, -0.037964820861816406, -0.03488922119140625, -0.031813621520996094, -0.028738021850585938, -0.02566242218017578, -0.022586822509765625, -0.01951122283935547, -0.016435623168945312, -0.013360023498535156, -0.010284423828125, -0.007208824157714844, -0.0041332244873046875, -0.0010576248168945312, 0.002017974853515625, 0.005093574523925781, 0.008169174194335938, 0.011244773864746094, 0.01432037353515625, 0.017395973205566406, 0.020471572875976562, 0.02354717254638672, 0.026622772216796875, 0.02969837188720703, 0.03277397155761719, 0.035849571228027344, 0.0389251708984375, 0.042000770568847656, 0.04507637023925781, 0.04815196990966797, 0.051227569580078125, 0.05430316925048828, 0.05737876892089844, 0.060454368591308594, 0.06352996826171875, 0.0666055679321289, 0.06968116760253906, 0.07275676727294922, 0.07583236694335938, 0.07890796661376953, 0.08198356628417969, 0.08505916595458984, 0.088134765625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 2.0, 1.0, 7.0, 10.0, 6.0, 9.0, 9.0, 19.0, 21.0, 21.0, 31.0, 40.0, 57.0, 96.0, 123.0, 151.0, 115.0, 76.0, 50.0, 28.0, 19.0, 22.0, 13.0, 15.0, 11.0, 9.0, 7.0, 9.0, 7.0, 3.0, 9.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.109476089477539e-05, -5.936063826084137e-05, -5.762651562690735e-05, -5.589239299297333e-05, -5.415827035903931e-05, -5.2424147725105286e-05, -5.0690025091171265e-05, -4.8955902457237244e-05, -4.722177982330322e-05, -4.54876571893692e-05, -4.375353455543518e-05, -4.201941192150116e-05, -4.028528928756714e-05, -3.855116665363312e-05, -3.68170440196991e-05, -3.5082921385765076e-05, -3.3348798751831055e-05, -3.1614676117897034e-05, -2.9880553483963013e-05, -2.8146430850028992e-05, -2.641230821609497e-05, -2.467818558216095e-05, -2.294406294822693e-05, -2.1209940314292908e-05, -1.9475817680358887e-05, -1.7741695046424866e-05, -1.6007572412490845e-05, -1.4273449778556824e-05, -1.2539327144622803e-05, -1.0805204510688782e-05, -9.07108187675476e-06, -7.33695924282074e-06, -5.602836608886719e-06, -3.868713974952698e-06, -2.1345913410186768e-06, -4.0046870708465576e-07, 1.3336539268493652e-06, 3.0677765607833862e-06, 4.801899194717407e-06, 6.536021828651428e-06, 8.27014446258545e-06, 1.000426709651947e-05, 1.1738389730453491e-05, 1.3472512364387512e-05, 1.5206634998321533e-05, 1.6940757632255554e-05, 1.8674880266189575e-05, 2.0409002900123596e-05, 2.2143125534057617e-05, 2.3877248167991638e-05, 2.561137080192566e-05, 2.734549343585968e-05, 2.90796160697937e-05, 3.081373870372772e-05, 3.254786133766174e-05, 3.4281983971595764e-05, 3.6016106605529785e-05, 3.7750229239463806e-05, 3.948435187339783e-05, 4.121847450733185e-05, 4.295259714126587e-05, 4.468671977519989e-05, 4.642084240913391e-05, 4.815496504306793e-05, 4.988908767700195e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 4.0, 11.0, 7.0, 16.0, 27.0, 33.0, 58.0, 84.0, 114.0, 270.0, 655.0, 1899.0, 8130.0, 58143.0, 917428.0, 51141.0, 7514.0, 1807.0, 618.0, 242.0, 111.0, 81.0, 41.0, 43.0, 20.0, 13.0, 6.0, 12.0, 1.0, 7.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1829833984375, -0.17751693725585938, -0.17205047607421875, -0.16658401489257812, -0.1611175537109375, -0.15565109252929688, -0.15018463134765625, -0.14471817016601562, -0.139251708984375, -0.13378524780273438, -0.12831878662109375, -0.12285232543945312, -0.1173858642578125, -0.11191940307617188, -0.10645294189453125, -0.10098648071289062, -0.09552001953125, -0.09005355834960938, -0.08458709716796875, -0.07912063598632812, -0.0736541748046875, -0.06818771362304688, -0.06272125244140625, -0.057254791259765625, -0.051788330078125, -0.046321868896484375, -0.04085540771484375, -0.035388946533203125, -0.0299224853515625, -0.024456024169921875, -0.01898956298828125, -0.013523101806640625, -0.008056640625, -0.002590179443359375, 0.00287628173828125, 0.008342742919921875, 0.0138092041015625, 0.019275665283203125, 0.02474212646484375, 0.030208587646484375, 0.035675048828125, 0.041141510009765625, 0.04660797119140625, 0.052074432373046875, 0.0575408935546875, 0.06300735473632812, 0.06847381591796875, 0.07394027709960938, 0.07940673828125, 0.08487319946289062, 0.09033966064453125, 0.09580612182617188, 0.1012725830078125, 0.10673904418945312, 0.11220550537109375, 0.11767196655273438, 0.123138427734375, 0.12860488891601562, 0.13407135009765625, 0.13953781127929688, 0.1450042724609375, 0.15047073364257812, 0.15593719482421875, 0.16140365600585938, 0.1668701171875]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 3.0, 11.0, 5.0, 10.0, 11.0, 19.0, 25.0, 18.0, 25.0, 45.0, 86.0, 90.0, 143.0, 140.0, 115.0, 80.0, 45.0, 41.0, 19.0, 19.0, 14.0, 10.0, 6.0, 5.0, 6.0, 7.0, 1.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.129638671875, -0.12485122680664062, -0.12006378173828125, -0.11527633666992188, -0.1104888916015625, -0.10570144653320312, -0.10091400146484375, -0.09612655639648438, -0.091339111328125, -0.08655166625976562, -0.08176422119140625, -0.07697677612304688, -0.0721893310546875, -0.06740188598632812, -0.06261444091796875, -0.057826995849609375, -0.05303955078125, -0.048252105712890625, -0.04346466064453125, -0.038677215576171875, -0.0338897705078125, -0.029102325439453125, -0.02431488037109375, -0.019527435302734375, -0.014739990234375, -0.009952545166015625, -0.00516510009765625, -0.000377655029296875, 0.0044097900390625, 0.009197235107421875, 0.01398468017578125, 0.018772125244140625, 0.0235595703125, 0.028347015380859375, 0.03313446044921875, 0.037921905517578125, 0.0427093505859375, 0.047496795654296875, 0.05228424072265625, 0.057071685791015625, 0.061859130859375, 0.06664657592773438, 0.07143402099609375, 0.07622146606445312, 0.0810089111328125, 0.08579635620117188, 0.09058380126953125, 0.09537124633789062, 0.10015869140625, 0.10494613647460938, 0.10973358154296875, 0.11452102661132812, 0.1193084716796875, 0.12409591674804688, 0.12888336181640625, 0.13367080688476562, 0.138458251953125, 0.14324569702148438, 0.14803314208984375, 0.15282058715820312, 0.1576080322265625, 0.16239547729492188, 0.16718292236328125, 0.17197036743164062, 0.1767578125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 8.0, 7.0, 12.0, 21.0, 33.0, 57.0, 86.0, 498.0, 128.0, 59.0, 41.0, 24.0, 11.0, 10.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9698657989501953, -3.831636428833008, -3.6934070587158203, -3.5551774501800537, -3.416948080062866, -3.2787187099456787, -3.140489101409912, -3.0022597312927246, -2.864030361175537, -2.7258009910583496, -2.587571620941162, -2.4493420124053955, -2.311112642288208, -2.1728832721710205, -2.034653663635254, -1.8964242935180664, -1.758194923400879, -1.6199655532836914, -1.4817360639572144, -1.3435065746307373, -1.2052772045135498, -1.0670478343963623, -0.9288183450698853, -0.790588915348053, -0.6523594856262207, -0.5141300559043884, -0.37590062618255615, -0.23767119646072388, -0.0994417667388916, 0.038787662982940674, 0.17701709270477295, 0.3152465224266052, 0.4534764289855957, 0.591705858707428, 0.7299352884292603, 0.8681647181510925, 1.0063941478729248, 1.1446235179901123, 1.2828530073165894, 1.4210824966430664, 1.559311866760254, 1.6975412368774414, 1.8357707262039185, 1.9740002155303955, 2.112229585647583, 2.2504589557647705, 2.388688564300537, 2.5269179344177246, 2.665147304534912, 2.8033766746520996, 2.941606044769287, 3.0798356533050537, 3.218065023422241, 3.3562943935394287, 3.4945240020751953, 3.632753372192383, 3.7709827423095703, 3.909212112426758, 4.047441482543945, 4.185670852661133, 4.32390022277832, 4.462130069732666, 4.6003594398498535, 4.738588809967041, 4.8768181800842285]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 9.0, 4.0, 6.0, 5.0, 5.0, 14.0, 9.0, 14.0, 27.0, 17.0, 20.0, 34.0, 28.0, 36.0, 70.0, 271.0, 178.0, 35.0, 30.0, 27.0, 21.0, 21.0, 15.0, 23.0, 21.0, 11.0, 8.0, 11.0, 10.0, 3.0, 8.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4926724433898926, -3.38931941986084, -3.285966157913208, -3.182612895965576, -3.0792598724365234, -2.9759068489074707, -2.872553586959839, -2.769200325012207, -2.6658473014831543, -2.5624942779541016, -2.4591410160064697, -2.355787754058838, -2.252434730529785, -2.1490817070007324, -2.0457284450531006, -1.9423753023147583, -1.839022159576416, -1.7356690168380737, -1.6323158740997314, -1.5289627313613892, -1.4256095886230469, -1.3222564458847046, -1.2189033031463623, -1.11555016040802, -1.0121970176696777, -0.9088438749313354, -0.8054907321929932, -0.7021375894546509, -0.5987844467163086, -0.4954313039779663, -0.392078161239624, -0.28872501850128174, -0.18537187576293945, -0.08201873302459717, 0.021334409713745117, 0.1246875524520874, 0.2280406951904297, 0.331393837928772, 0.43474698066711426, 0.5381001234054565, 0.6414532661437988, 0.7448064088821411, 0.8481595516204834, 0.9515126943588257, 1.054865837097168, 1.1582189798355103, 1.2615721225738525, 1.3649252653121948, 1.468278408050537, 1.5716315507888794, 1.6749846935272217, 1.778337836265564, 1.8816909790039062, 1.9850441217422485, 2.088397264480591, 2.1917505264282227, 2.2951035499572754, 2.398456573486328, 2.50180983543396, 2.605163097381592, 2.7085161209106445, 2.8118691444396973, 2.915222406387329, 3.018575668334961, 3.1219286918640137]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 2.0, 6.0, 7.0, 11.0, 18.0, 22.0, 26.0, 27.0, 47.0, 55.0, 70.0, 221.0, 181.0, 68.0, 64.0, 57.0, 27.0, 24.0, 17.0, 13.0, 12.0, 7.0, 8.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.54931640625, -0.5359115600585938, -0.5225067138671875, -0.5091018676757812, -0.495697021484375, -0.48229217529296875, -0.4688873291015625, -0.45548248291015625, -0.44207763671875, -0.42867279052734375, -0.4152679443359375, -0.40186309814453125, -0.388458251953125, -0.37505340576171875, -0.3616485595703125, -0.34824371337890625, -0.3348388671875, -0.32143402099609375, -0.3080291748046875, -0.29462432861328125, -0.281219482421875, -0.26781463623046875, -0.2544097900390625, -0.24100494384765625, -0.22760009765625, -0.21419525146484375, -0.2007904052734375, -0.18738555908203125, -0.173980712890625, -0.16057586669921875, -0.1471710205078125, -0.13376617431640625, -0.120361328125, -0.10695648193359375, -0.0935516357421875, -0.08014678955078125, -0.066741943359375, -0.05333709716796875, -0.0399322509765625, -0.02652740478515625, -0.01312255859375, 0.00028228759765625, 0.0136871337890625, 0.02709197998046875, 0.040496826171875, 0.05390167236328125, 0.0673065185546875, 0.08071136474609375, 0.0941162109375, 0.10752105712890625, 0.1209259033203125, 0.13433074951171875, 0.147735595703125, 0.16114044189453125, 0.1745452880859375, 0.18795013427734375, 0.20135498046875, 0.21475982666015625, 0.2281646728515625, 0.24156951904296875, 0.254974365234375, 0.26837921142578125, 0.2817840576171875, 0.29518890380859375, 0.30859375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 4.0, 6.0, 16.0, 19.0, 24.0, 30.0, 49.0, 98.0, 158.0, 287.0, 699.0, 1902.0, 7964.0, 8224940.0, 143806.0, 5819.0, 1538.0, 598.0, 270.0, 145.0, 59.0, 40.0, 34.0, 20.0, 9.0, 10.0, 13.0, 5.0, 4.0, 1.0, 0.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.6175522804260254, -2.5502750873565674, -2.4829978942871094, -2.4157207012176514, -2.3484435081481934, -2.2811665534973145, -2.2138891220092773, -2.1466121673583984, -2.0793349742889404, -2.0120577812194824, -1.9447805881500244, -1.8775033950805664, -1.810226321220398, -1.74294912815094, -1.675671935081482, -1.608394742012024, -1.541117548942566, -1.473840355873108, -1.40656316280365, -1.3392860889434814, -1.2720088958740234, -1.2047317028045654, -1.1374545097351074, -1.0701773166656494, -1.0029001235961914, -0.9356229305267334, -0.8683457970619202, -0.8010686039924622, -0.7337914705276489, -0.6665142774581909, -0.5992370843887329, -0.5319598913192749, -0.46468281745910645, -0.3974056541919708, -0.3301284909248352, -0.2628512978553772, -0.19557413458824158, -0.12829697132110596, -0.06101977825164795, 0.006257385015487671, 0.07353454828262329, 0.1408117115497589, 0.20808888971805573, 0.27536606788635254, 0.34264323115348816, 0.4099203944206238, 0.4771975874900818, 0.544474720954895, 0.611751914024353, 0.679029107093811, 0.7463062405586243, 0.8135834336280823, 0.8808605670928955, 0.9481377601623535, 1.0154149532318115, 1.0826921463012695, 1.1499693393707275, 1.2172465324401855, 1.2845237255096436, 1.3518009185791016, 1.41907799243927, 1.486355185508728, 1.553632378578186, 1.620909571647644, 1.6881866455078125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 3.0, 2.0, 3.0, 2.0, 3.0, 7.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 5.0, 4.0, 6.0, 3.0, 3.0, 4.0, 1.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.449858546257019, -1.405657410621643, -1.3614561557769775, -1.3172550201416016, -1.2730538845062256, -1.2288527488708496, -1.184651494026184, -1.140450358390808, -1.0962492227554321, -1.0520480871200562, -1.0078468322753906, -0.9636456966400146, -0.9194445610046387, -0.8752433657646179, -0.8310421705245972, -0.7868410348892212, -0.7426398396492004, -0.6984386444091797, -0.6542375087738037, -0.610036313533783, -0.565835177898407, -0.5216339826583862, -0.47743281722068787, -0.4332316517829895, -0.38903048634529114, -0.3448293209075928, -0.3006281554698944, -0.25642699003219604, -0.2122258096933365, -0.16802464425563812, -0.12382346391677856, -0.0796222984790802, -0.035421133041381836, 0.008780036121606827, 0.05298120528459549, 0.09718237817287445, 0.14138354361057281, 0.18558470904827118, 0.22978588938713074, 0.2739870548248291, 0.31818822026252747, 0.36238938570022583, 0.4065905511379242, 0.45079171657562256, 0.4949929118156433, 0.5391940474510193, 0.58339524269104, 0.627596378326416, 0.6717975735664368, 0.7159987688064575, 0.7601999044418335, 0.8044010996818542, 0.8486022353172302, 0.892803430557251, 0.937004566192627, 0.9812057614326477, 1.0254069566726685, 1.0696080923080444, 1.11380934715271, 1.158010482788086, 1.202211618423462, 1.246412754058838, 1.2906140089035034, 1.3348151445388794, 1.3790162801742554]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 4.0, 9.0, 6.0, 18.0, 28.0, 27.0, 52.0, 96.0, 135.0, 246.0, 458.0, 838.0, 1948.0, 4494.0, 11939.0, 36896.0, 132104.0, 224156.0, 75418.0, 21935.0, 7668.0, 2919.0, 1280.0, 660.0, 370.0, 181.0, 109.0, 80.0, 60.0, 36.0, 21.0, 21.0, 18.0, 10.0, 7.0, 6.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7939453125, -1.7281951904296875, -1.662445068359375, -1.5966949462890625, -1.53094482421875, -1.4651947021484375, -1.399444580078125, -1.3336944580078125, -1.2679443359375, -1.2021942138671875, -1.136444091796875, -1.0706939697265625, -1.00494384765625, -0.9391937255859375, -0.873443603515625, -0.8076934814453125, -0.741943359375, -0.6761932373046875, -0.610443115234375, -0.5446929931640625, -0.47894287109375, -0.4131927490234375, -0.347442626953125, -0.2816925048828125, -0.2159423828125, -0.1501922607421875, -0.084442138671875, -0.0186920166015625, 0.04705810546875, 0.1128082275390625, 0.178558349609375, 0.2443084716796875, 0.31005859375, 0.3758087158203125, 0.441558837890625, 0.5073089599609375, 0.57305908203125, 0.6388092041015625, 0.704559326171875, 0.7703094482421875, 0.8360595703125, 0.9018096923828125, 0.967559814453125, 1.0333099365234375, 1.09906005859375, 1.1648101806640625, 1.230560302734375, 1.2963104248046875, 1.362060546875, 1.4278106689453125, 1.493560791015625, 1.5593109130859375, 1.62506103515625, 1.6908111572265625, 1.756561279296875, 1.8223114013671875, 1.8880615234375, 1.9538116455078125, 2.019561767578125, 2.0853118896484375, 2.15106201171875, 2.2168121337890625, 2.282562255859375, 2.3483123779296875, 2.4140625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 1.0, 8.0, 5.0, 11.0, 6.0, 19.0, 17.0, 26.0, 38.0, 33.0, 42.0, 62.0, 70.0, 82.0, 85.0, 83.0, 63.0, 69.0, 54.0, 33.0, 39.0, 31.0, 29.0, 21.0, 18.0, 14.0, 17.0, 4.0, 13.0, 7.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.250732421875, -0.24153518676757812, -0.23233795166015625, -0.22314071655273438, -0.2139434814453125, -0.20474624633789062, -0.19554901123046875, -0.18635177612304688, -0.177154541015625, -0.16795730590820312, -0.15876007080078125, -0.14956283569335938, -0.1403656005859375, -0.13116836547851562, -0.12197113037109375, -0.11277389526367188, -0.10357666015625, -0.09437942504882812, -0.08518218994140625, -0.07598495483398438, -0.0667877197265625, -0.057590484619140625, -0.04839324951171875, -0.039196014404296875, -0.029998779296875, -0.020801544189453125, -0.01160430908203125, -0.002407073974609375, 0.0067901611328125, 0.015987396240234375, 0.02518463134765625, 0.034381866455078125, 0.0435791015625, 0.052776336669921875, 0.06197357177734375, 0.07117080688476562, 0.0803680419921875, 0.08956527709960938, 0.09876251220703125, 0.10795974731445312, 0.117156982421875, 0.12635421752929688, 0.13555145263671875, 0.14474868774414062, 0.1539459228515625, 0.16314315795898438, 0.17234039306640625, 0.18153762817382812, 0.19073486328125, 0.19993209838867188, 0.20912933349609375, 0.21832656860351562, 0.2275238037109375, 0.23672103881835938, 0.24591827392578125, 0.2551155090332031, 0.264312744140625, 0.2735099792480469, 0.28270721435546875, 0.2919044494628906, 0.3011016845703125, 0.3102989196777344, 0.31949615478515625, 0.3286933898925781, 0.337890625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 2.0, 5.0, 11.0, 3.0, 15.0, 27.0, 37.0, 77.0, 96.0, 81.0, 54.0, 21.0, 22.0, 11.0, 5.0, 8.0, 2.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.417670726776123, -2.3386070728302, -2.2595436573028564, -2.1804800033569336, -2.10141658782959, -2.022352933883667, -1.9432893991470337, -1.8642258644104004, -1.7851622104644775, -1.7060986757278442, -1.627035140991211, -1.547971487045288, -1.4689079523086548, -1.3898444175720215, -1.3107808828353882, -1.2317173480987549, -1.1526538133621216, -1.0735902786254883, -0.9945266842842102, -0.9154631495475769, -0.8363995552062988, -0.7573360204696655, -0.6782724857330322, -0.5992088913917542, -0.5201453566551208, -0.44108179211616516, -0.3620182275772095, -0.28295469284057617, -0.20389112830162048, -0.1248275637626648, -0.045764029026031494, 0.03329956531524658, 0.11236310005187988, 0.19142666459083557, 0.27049022912979126, 0.34955376386642456, 0.42861732840538025, 0.5076808929443359, 0.5867444276809692, 0.6658080220222473, 0.7448715567588806, 0.8239350914955139, 0.902998685836792, 0.9820622205734253, 1.0611257553100586, 1.1401894092559814, 1.2192528247833252, 1.298316478729248, 1.3773800134658813, 1.4564435482025146, 1.535507082939148, 1.6145706176757812, 1.693634271621704, 1.7726978063583374, 1.8517613410949707, 1.9308249950408936, 2.0098884105682373, 2.08895206451416, 2.168015480041504, 2.2470791339874268, 2.3261425495147705, 2.4052062034606934, 2.484269618988037, 2.56333327293396, 2.642396926879883]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 5.0, 5.0, 10.0, 15.0, 35.0, 59.0, 90.0, 107.0, 60.0, 30.0, 18.0, 3.0, 3.0, 3.0, 6.0, 3.0, 3.0, 3.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.895876407623291, -1.8465129137039185, -1.797149419784546, -1.747786045074463, -1.6984225511550903, -1.6490590572357178, -1.5996955633163452, -1.5503320693969727, -1.5009686946868896, -1.451605200767517, -1.4022417068481445, -1.3528783321380615, -1.303514838218689, -1.2541513442993164, -1.2047878503799438, -1.1554243564605713, -1.1060608625411987, -1.0566973686218262, -1.0073338747024536, -0.9579704403877258, -0.908607006072998, -0.8592435121536255, -0.8098800182342529, -0.7605165243148804, -0.7111530900001526, -0.66178959608078, -0.6124261617660522, -0.5630626678466797, -0.5136991739273071, -0.46433573961257935, -0.4149722456932068, -0.3656087815761566, -0.31624531745910645, -0.2668818533420563, -0.2175183743238449, -0.16815489530563354, -0.11879143118858337, -0.0694279670715332, -0.020064473152160645, 0.029298990964889526, 0.0786624550819397, 0.12802591919898987, 0.17738939821720123, 0.2267528772354126, 0.27611634135246277, 0.32547980546951294, 0.3748432993888855, 0.42420676350593567, 0.47357022762298584, 0.5229337215423584, 0.5722971558570862, 0.6216606497764587, 0.6710240840911865, 0.7203875780105591, 0.7697510719299316, 0.8191145658493042, 0.868478000164032, 0.9178414940834045, 0.9672049283981323, 1.0165684223175049, 1.0659319162368774, 1.11529541015625, 1.164658784866333, 1.2140222787857056, 1.2633857727050781]}, "_wandb": {"runtime": 2391}} \ No newline at end of file