diff --git "a/wandb/run-20220301_145657-3jv2086j/files/wandb-summary.json" "b/wandb/run-20220301_145657-3jv2086j/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220301_145657-3jv2086j/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 4.267, "train/learning_rate": 2.682e-05, "train/epoch": 0.88, "train/global_step": 450, "_runtime": 4134, "_timestamp": 1646150751, "_step": 449, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 12.0, 148.0, 459.0, 311.0, 75.0, 6.0, 1.0, 2.0], "bins": [-266.0886535644531, -261.56781005859375, -257.0469970703125, -252.5261688232422, -248.00534057617188, -243.4844970703125, -238.96368408203125, -234.44284057617188, -229.92201232910156, -225.40118408203125, -220.88035583496094, -216.35952758789062, -211.8386993408203, -207.31787109375, -202.79702758789062, -198.2761993408203, -193.75537109375, -189.2345428466797, -184.71371459960938, -180.19288635253906, -175.67205810546875, -171.15121459960938, -166.63040161132812, -162.10955810546875, -157.5887451171875, -153.0679168701172, -148.54708862304688, -144.02626037597656, -139.50543212890625, -134.98458862304688, -130.46377563476562, -125.94293975830078, -121.42211151123047, -116.90128326416016, -112.38045501708984, -107.859619140625, -103.33879089355469, -98.81796264648438, -94.29713439941406, -89.77630615234375, -85.2554702758789, -80.7346420288086, -76.21381378173828, -71.69297790527344, -67.17214965820312, -62.65132141113281, -58.1304931640625, -53.60966491699219, -49.088836669921875, -44.56800842285156, -40.047176361083984, -35.52634811401367, -31.005517959594727, -26.48468780517578, -21.96385955810547, -17.443029403686523, -12.922197341918945, -8.4013671875, -3.880537986755371, 0.6402912139892578, 5.161121368408203, 9.681951522827148, 14.202779769897461, 18.723609924316406, 23.24444007873535]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 10.0, 6.0, 10.0, 11.0, 15.0, 14.0, 24.0, 20.0, 33.0, 35.0, 46.0, 39.0, 46.0, 55.0, 56.0, 57.0, 59.0, 60.0, 46.0, 51.0, 46.0, 45.0, 31.0, 40.0, 29.0, 20.0, 29.0, 17.0, 9.0, 11.0, 9.0, 11.0, 8.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.9656982421875, -48.96318054199219, -46.96065902709961, -44.9581413269043, -42.95561981201172, -40.953102111816406, -38.950584411621094, -36.948062896728516, -34.94554138183594, -32.943023681640625, -30.940502166748047, -28.937984466552734, -26.935462951660156, -24.932945251464844, -22.9304256439209, -20.927906036376953, -18.92538833618164, -16.922868728637695, -14.92034912109375, -12.917830467224121, -10.915310859680176, -8.91279125213623, -6.910272598266602, -4.907752990722656, -2.905233383178711, -0.9027140140533447, 1.0998053550720215, 3.1023244857788086, 5.104844093322754, 7.107363700866699, 9.109882354736328, 11.112401962280273, 13.114921569824219, 15.117441177368164, 17.11996078491211, 19.122478485107422, 21.125, 23.127517700195312, 25.130037307739258, 27.132556915283203, 29.13507652282715, 31.137596130371094, 33.140113830566406, 35.142635345458984, 37.1451530456543, 39.147674560546875, 41.15019226074219, 43.1527099609375, 45.15523147583008, 47.15774917602539, 49.16027069091797, 51.16278839111328, 53.16530990600586, 55.16782760620117, 57.17034912109375, 59.17286682128906, 61.175384521484375, 63.17790222167969, 65.180419921875, 67.18294525146484, 69.18546295166016, 71.18798065185547, 73.19049835205078, 75.19302368164062, 77.19554138183594]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 5.0, 9.0, 8.0, 12.0, 6.0, 14.0, 18.0, 18.0, 24.0, 25.0, 31.0, 39.0, 34.0, 48.0, 40.0, 48.0, 55.0, 51.0, 51.0, 48.0, 45.0, 42.0, 32.0, 54.0, 40.0, 44.0, 28.0, 29.0, 23.0, 11.0, 10.0, 16.0, 11.0, 7.0, 9.0, 11.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.974609375, -3.8553466796875, -3.736083984375, -3.6168212890625, -3.49755859375, -3.3782958984375, -3.259033203125, -3.1397705078125, -3.0205078125, -2.9012451171875, -2.781982421875, -2.6627197265625, -2.54345703125, -2.4241943359375, -2.304931640625, -2.1856689453125, -2.06640625, -1.9471435546875, -1.827880859375, -1.7086181640625, -1.58935546875, -1.4700927734375, -1.350830078125, -1.2315673828125, -1.1123046875, -0.9930419921875, -0.873779296875, -0.7545166015625, -0.63525390625, -0.5159912109375, -0.396728515625, -0.2774658203125, -0.158203125, -0.0389404296875, 0.080322265625, 0.1995849609375, 0.31884765625, 0.4381103515625, 0.557373046875, 0.6766357421875, 0.7958984375, 0.9151611328125, 1.034423828125, 1.1536865234375, 1.27294921875, 1.3922119140625, 1.511474609375, 1.6307373046875, 1.75, 1.8692626953125, 1.988525390625, 2.1077880859375, 2.22705078125, 2.3463134765625, 2.465576171875, 2.5848388671875, 2.7041015625, 2.8233642578125, 2.942626953125, 3.0618896484375, 3.18115234375, 3.3004150390625, 3.419677734375, 3.5389404296875, 3.658203125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 5.0, 3.0, 4.0, 6.0, 5.0, 8.0, 11.0, 15.0, 31.0, 55.0, 45.0, 88.0, 146.0, 208.0, 295.0, 526.0, 823.0, 1577.0, 3054.0, 7108.0, 22765.0, 140346.0, 1852395.0, 1972359.0, 154676.0, 23609.0, 7166.0, 3069.0, 1561.0, 851.0, 557.0, 301.0, 195.0, 108.0, 95.0, 69.0, 42.0, 40.0, 29.0, 10.0, 14.0, 8.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.75, -9.375244140625, -9.00048828125, -8.625732421875, -8.2509765625, -7.876220703125, -7.50146484375, -7.126708984375, -6.751953125, -6.377197265625, -6.00244140625, -5.627685546875, -5.2529296875, -4.878173828125, -4.50341796875, -4.128662109375, -3.75390625, -3.379150390625, -3.00439453125, -2.629638671875, -2.2548828125, -1.880126953125, -1.50537109375, -1.130615234375, -0.755859375, -0.381103515625, -0.00634765625, 0.368408203125, 0.7431640625, 1.117919921875, 1.49267578125, 1.867431640625, 2.2421875, 2.616943359375, 2.99169921875, 3.366455078125, 3.7412109375, 4.115966796875, 4.49072265625, 4.865478515625, 5.240234375, 5.614990234375, 5.98974609375, 6.364501953125, 6.7392578125, 7.114013671875, 7.48876953125, 7.863525390625, 8.23828125, 8.613037109375, 8.98779296875, 9.362548828125, 9.7373046875, 10.112060546875, 10.48681640625, 10.861572265625, 11.236328125, 11.611083984375, 11.98583984375, 12.360595703125, 12.7353515625, 13.110107421875, 13.48486328125, 13.859619140625, 14.234375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 6.0, 6.0, 20.0, 30.0, 44.0, 90.0, 120.0, 229.0, 376.0, 591.0, 803.0, 660.0, 424.0, 268.0, 160.0, 89.0, 45.0, 47.0, 20.0, 13.0, 16.0, 6.0, 3.0, 2.0, 4.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.65625, -20.076171875, -19.49609375, -18.916015625, -18.3359375, -17.755859375, -17.17578125, -16.595703125, -16.015625, -15.435546875, -14.85546875, -14.275390625, -13.6953125, -13.115234375, -12.53515625, -11.955078125, -11.375, -10.794921875, -10.21484375, -9.634765625, -9.0546875, -8.474609375, -7.89453125, -7.314453125, -6.734375, -6.154296875, -5.57421875, -4.994140625, -4.4140625, -3.833984375, -3.25390625, -2.673828125, -2.09375, -1.513671875, -0.93359375, -0.353515625, 0.2265625, 0.806640625, 1.38671875, 1.966796875, 2.546875, 3.126953125, 3.70703125, 4.287109375, 4.8671875, 5.447265625, 6.02734375, 6.607421875, 7.1875, 7.767578125, 8.34765625, 8.927734375, 9.5078125, 10.087890625, 10.66796875, 11.248046875, 11.828125, 12.408203125, 12.98828125, 13.568359375, 14.1484375, 14.728515625, 15.30859375, 15.888671875, 16.46875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 9.0, 10.0, 19.0, 19.0, 46.0, 76.0, 125.0, 233.0, 445.0, 945.0, 2549.0, 42801.0, 4098403.0, 43997.0, 2543.0, 993.0, 463.0, 230.0, 163.0, 74.0, 45.0, 33.0, 14.0, 17.0, 11.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.1875, -57.2470703125, -55.306640625, -53.3662109375, -51.42578125, -49.4853515625, -47.544921875, -45.6044921875, -43.6640625, -41.7236328125, -39.783203125, -37.8427734375, -35.90234375, -33.9619140625, -32.021484375, -30.0810546875, -28.140625, -26.2001953125, -24.259765625, -22.3193359375, -20.37890625, -18.4384765625, -16.498046875, -14.5576171875, -12.6171875, -10.6767578125, -8.736328125, -6.7958984375, -4.85546875, -2.9150390625, -0.974609375, 0.9658203125, 2.90625, 4.8466796875, 6.787109375, 8.7275390625, 10.66796875, 12.6083984375, 14.548828125, 16.4892578125, 18.4296875, 20.3701171875, 22.310546875, 24.2509765625, 26.19140625, 28.1318359375, 30.072265625, 32.0126953125, 33.953125, 35.8935546875, 37.833984375, 39.7744140625, 41.71484375, 43.6552734375, 45.595703125, 47.5361328125, 49.4765625, 51.4169921875, 53.357421875, 55.2978515625, 57.23828125, 59.1787109375, 61.119140625, 63.0595703125, 65.0]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 53.0, 301.0, 464.0, 165.0, 26.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-219.4249267578125, -214.96035766601562, -210.49578857421875, -206.0312042236328, -201.56663513183594, -197.10206604003906, -192.6374969482422, -188.1729278564453, -183.70834350585938, -179.2437744140625, -174.77920532226562, -170.3146209716797, -165.8500518798828, -161.38548278808594, -156.92091369628906, -152.4563446044922, -147.9917755126953, -143.52720642089844, -139.06263732910156, -134.59805297851562, -130.13348388671875, -125.66891479492188, -121.204345703125, -116.73977661132812, -112.27519989013672, -107.81063079833984, -103.34605407714844, -98.88148498535156, -94.41691589355469, -89.95233917236328, -85.4877700805664, -81.023193359375, -76.55862426757812, -72.09405517578125, -67.62947845458984, -63.16490936279297, -58.70033645629883, -54.23576354980469, -49.77119445800781, -45.30662155151367, -40.84204864501953, -36.37747573852539, -31.912904739379883, -27.448333740234375, -22.983760833740234, -18.519187927246094, -14.054616928100586, -9.590045928955078, -5.1254730224609375, -0.6609010696411133, 3.803670883178711, 8.268242835998535, 12.73281478881836, 17.1973876953125, 21.661958694458008, 26.126529693603516, 30.591102600097656, 35.0556755065918, 39.52024841308594, 43.98481750488281, 48.44939041137695, 52.913963317871094, 57.37853240966797, 61.84310531616211, 66.30767822265625]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 1.0, 2.0, 6.0, 6.0, 10.0, 11.0, 12.0, 12.0, 20.0, 32.0, 42.0, 32.0, 26.0, 46.0, 35.0, 54.0, 55.0, 47.0, 57.0, 52.0, 61.0, 54.0, 46.0, 41.0, 39.0, 39.0, 28.0, 30.0, 24.0, 16.0, 16.0, 16.0, 10.0, 12.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-61.339256286621094, -59.79381561279297, -58.248374938964844, -56.70293426513672, -55.157493591308594, -53.61205291748047, -52.066612243652344, -50.52117156982422, -48.975730895996094, -47.43029022216797, -45.884849548339844, -44.33940887451172, -42.793968200683594, -41.24852752685547, -39.703086853027344, -38.15764617919922, -36.612205505371094, -35.06676483154297, -33.521324157714844, -31.97588348388672, -30.430442810058594, -28.88500213623047, -27.339561462402344, -25.79412078857422, -24.24868392944336, -22.703243255615234, -21.15780258178711, -19.612361907958984, -18.06692123413086, -16.521480560302734, -14.976040840148926, -13.4306001663208, -11.88515853881836, -10.339717864990234, -8.79427719116211, -7.248836994171143, -5.703396320343018, -4.157955646514893, -2.612515449523926, -1.0670747756958008, 0.4783658981323242, 2.023806571960449, 3.569247007369995, 5.114687442779541, 6.660128116607666, 8.205568313598633, 9.751008987426758, 11.296449661254883, 12.841890335083008, 14.387331008911133, 15.932771682739258, 17.478212356567383, 19.023653030395508, 20.569093704223633, 22.114532470703125, 23.65997314453125, 25.205413818359375, 26.7508544921875, 28.296295166015625, 29.84173583984375, 31.387176513671875, 32.9326171875, 34.478057861328125, 36.02349853515625, 37.568939208984375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 4.0, 7.0, 12.0, 7.0, 3.0, 13.0, 9.0, 21.0, 20.0, 17.0, 28.0, 23.0, 29.0, 24.0, 34.0, 30.0, 35.0, 33.0, 39.0, 45.0, 42.0, 43.0, 36.0, 46.0, 39.0, 32.0, 38.0, 42.0, 37.0, 23.0, 26.0, 22.0, 19.0, 25.0, 18.0, 17.0, 13.0, 9.0, 10.0, 9.0, 8.0, 5.0, 3.0, 1.0, 6.0, 3.0, 2.0, 2.0], "bins": [-3.94140625, -3.836181640625, -3.73095703125, -3.625732421875, -3.5205078125, -3.415283203125, -3.31005859375, -3.204833984375, -3.099609375, -2.994384765625, -2.88916015625, -2.783935546875, -2.6787109375, -2.573486328125, -2.46826171875, -2.363037109375, -2.2578125, -2.152587890625, -2.04736328125, -1.942138671875, -1.8369140625, -1.731689453125, -1.62646484375, -1.521240234375, -1.416015625, -1.310791015625, -1.20556640625, -1.100341796875, -0.9951171875, -0.889892578125, -0.78466796875, -0.679443359375, -0.57421875, -0.468994140625, -0.36376953125, -0.258544921875, -0.1533203125, -0.048095703125, 0.05712890625, 0.162353515625, 0.267578125, 0.372802734375, 0.47802734375, 0.583251953125, 0.6884765625, 0.793701171875, 0.89892578125, 1.004150390625, 1.109375, 1.214599609375, 1.31982421875, 1.425048828125, 1.5302734375, 1.635498046875, 1.74072265625, 1.845947265625, 1.951171875, 2.056396484375, 2.16162109375, 2.266845703125, 2.3720703125, 2.477294921875, 2.58251953125, 2.687744140625, 2.79296875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 7.0, 8.0, 18.0, 26.0, 36.0, 56.0, 94.0, 122.0, 204.0, 340.0, 489.0, 761.0, 1160.0, 1890.0, 2995.0, 5042.0, 8198.0, 13115.0, 21872.0, 37424.0, 65307.0, 117877.0, 204565.0, 233160.0, 143749.0, 78610.0, 44590.0, 26445.0, 15524.0, 9360.0, 5850.0, 3626.0, 2177.0, 1461.0, 862.0, 566.0, 327.0, 219.0, 144.0, 87.0, 62.0, 38.0, 32.0, 21.0, 11.0, 15.0, 3.0, 5.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.486572265625, -0.4709587097167969, -0.45534515380859375, -0.4397315979003906, -0.4241180419921875, -0.4085044860839844, -0.39289093017578125, -0.3772773742675781, -0.361663818359375, -0.3460502624511719, -0.33043670654296875, -0.3148231506347656, -0.2992095947265625, -0.2835960388183594, -0.26798248291015625, -0.2523689270019531, -0.23675537109375, -0.22114181518554688, -0.20552825927734375, -0.18991470336914062, -0.1743011474609375, -0.15868759155273438, -0.14307403564453125, -0.12746047973632812, -0.111846923828125, -0.09623336791992188, -0.08061981201171875, -0.06500625610351562, -0.0493927001953125, -0.033779144287109375, -0.01816558837890625, -0.002552032470703125, 0.0130615234375, 0.028675079345703125, 0.04428863525390625, 0.059902191162109375, 0.0755157470703125, 0.09112930297851562, 0.10674285888671875, 0.12235641479492188, 0.137969970703125, 0.15358352661132812, 0.16919708251953125, 0.18481063842773438, 0.2004241943359375, 0.21603775024414062, 0.23165130615234375, 0.24726486206054688, 0.26287841796875, 0.2784919738769531, 0.29410552978515625, 0.3097190856933594, 0.3253326416015625, 0.3409461975097656, 0.35655975341796875, 0.3721733093261719, 0.387786865234375, 0.4034004211425781, 0.41901397705078125, 0.4346275329589844, 0.4502410888671875, 0.4658546447753906, 0.48146820068359375, 0.4970817565917969, 0.5126953125]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 3.0, 9.0, 7.0, 13.0, 13.0, 17.0, 18.0, 22.0, 30.0, 27.0, 33.0, 32.0, 31.0, 44.0, 41.0, 47.0, 45.0, 49.0, 1078.0, 46.0, 52.0, 36.0, 45.0, 44.0, 38.0, 40.0, 31.0, 29.0, 26.0, 18.0, 16.0, 11.0, 5.0, 9.0, 4.0, 6.0, 3.0, 4.0, 5.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-3.00390625, -2.925567626953125, -2.84722900390625, -2.768890380859375, -2.6905517578125, -2.612213134765625, -2.53387451171875, -2.455535888671875, -2.377197265625, -2.298858642578125, -2.22052001953125, -2.142181396484375, -2.0638427734375, -1.985504150390625, -1.90716552734375, -1.828826904296875, -1.75048828125, -1.672149658203125, -1.59381103515625, -1.515472412109375, -1.4371337890625, -1.358795166015625, -1.28045654296875, -1.202117919921875, -1.123779296875, -1.045440673828125, -0.96710205078125, -0.888763427734375, -0.8104248046875, -0.732086181640625, -0.65374755859375, -0.575408935546875, -0.4970703125, -0.418731689453125, -0.34039306640625, -0.262054443359375, -0.1837158203125, -0.105377197265625, -0.02703857421875, 0.051300048828125, 0.129638671875, 0.207977294921875, 0.28631591796875, 0.364654541015625, 0.4429931640625, 0.521331787109375, 0.59967041015625, 0.678009033203125, 0.75634765625, 0.834686279296875, 0.91302490234375, 0.991363525390625, 1.0697021484375, 1.148040771484375, 1.22637939453125, 1.304718017578125, 1.383056640625, 1.461395263671875, 1.53973388671875, 1.618072509765625, 1.6964111328125, 1.774749755859375, 1.85308837890625, 1.931427001953125, 2.009765625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 7.0, 2.0, 7.0, 16.0, 25.0, 28.0, 41.0, 53.0, 88.0, 153.0, 230.0, 319.0, 523.0, 843.0, 1314.0, 1993.0, 3292.0, 5211.0, 8386.0, 14057.0, 23732.0, 40847.0, 72327.0, 129746.0, 220320.0, 1251752.0, 137627.0, 76986.0, 43424.0, 25205.0, 14839.0, 9024.0, 5518.0, 3449.0, 2084.0, 1384.0, 798.0, 513.0, 329.0, 223.0, 143.0, 99.0, 52.0, 39.0, 23.0, 19.0, 20.0, 7.0, 7.0, 7.0, 4.0, 6.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.441162109375, -0.4278144836425781, -0.41446685791015625, -0.4011192321777344, -0.3877716064453125, -0.3744239807128906, -0.36107635498046875, -0.3477287292480469, -0.334381103515625, -0.3210334777832031, -0.30768585205078125, -0.2943382263183594, -0.2809906005859375, -0.2676429748535156, -0.25429534912109375, -0.24094772338867188, -0.22760009765625, -0.21425247192382812, -0.20090484619140625, -0.18755722045898438, -0.1742095947265625, -0.16086196899414062, -0.14751434326171875, -0.13416671752929688, -0.120819091796875, -0.10747146606445312, -0.09412384033203125, -0.08077621459960938, -0.0674285888671875, -0.054080963134765625, -0.04073333740234375, -0.027385711669921875, -0.0140380859375, -0.000690460205078125, 0.01265716552734375, 0.026004791259765625, 0.0393524169921875, 0.052700042724609375, 0.06604766845703125, 0.07939529418945312, 0.092742919921875, 0.10609054565429688, 0.11943817138671875, 0.13278579711914062, 0.1461334228515625, 0.15948104858398438, 0.17282867431640625, 0.18617630004882812, 0.19952392578125, 0.21287155151367188, 0.22621917724609375, 0.23956680297851562, 0.2529144287109375, 0.2662620544433594, 0.27960968017578125, 0.2929573059082031, 0.306304931640625, 0.3196525573730469, 0.33300018310546875, 0.3463478088378906, 0.3596954345703125, 0.3730430603027344, 0.38639068603515625, 0.3997383117675781, 0.4130859375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 7.0, 5.0, 13.0, 21.0, 17.0, 24.0, 26.0, 28.0, 43.0, 51.0, 51.0, 58.0, 54.0, 66.0, 78.0, 48.0, 47.0, 56.0, 56.0, 38.0, 37.0, 42.0, 32.0, 20.0, 23.0, 19.0, 15.0, 9.0, 8.0, 5.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009026527404785156, -0.000867791473865509, -0.0008329302072525024, -0.0007980689406394958, -0.0007632076740264893, -0.0007283464074134827, -0.0006934851408004761, -0.0006586238741874695, -0.0006237626075744629, -0.0005889013409614563, -0.0005540400743484497, -0.0005191788077354431, -0.0004843175411224365, -0.00044945627450942993, -0.00041459500789642334, -0.00037973374128341675, -0.00034487247467041016, -0.00031001120805740356, -0.00027514994144439697, -0.00024028867483139038, -0.0002054274082183838, -0.0001705661416053772, -0.0001357048749923706, -0.00010084360837936401, -6.598234176635742e-05, -3.112107515335083e-05, 3.7401914596557617e-06, 3.8601458072662354e-05, 7.346272468566895e-05, 0.00010832399129867554, 0.00014318525791168213, 0.00017804652452468872, 0.0002129077911376953, 0.0002477690577507019, 0.0002826303243637085, 0.0003174915909767151, 0.0003523528575897217, 0.00038721412420272827, 0.00042207539081573486, 0.00045693665742874146, 0.000491797924041748, 0.0005266591906547546, 0.0005615204572677612, 0.0005963817238807678, 0.0006312429904937744, 0.000666104257106781, 0.0007009655237197876, 0.0007358267903327942, 0.0007706880569458008, 0.0008055493235588074, 0.000840410590171814, 0.0008752718567848206, 0.0009101331233978271, 0.0009449943900108337, 0.0009798556566238403, 0.001014716923236847, 0.0010495781898498535, 0.00108443945646286, 0.0011193007230758667, 0.0011541619896888733, 0.0011890232563018799, 0.0012238845229148865, 0.001258745789527893, 0.0012936070561408997, 0.0013284683227539062]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 4.0, 2.0, 4.0, 8.0, 24.0, 33.0, 42.0, 74.0, 71.0, 86.0, 131.0, 159.0, 239.0, 352.0, 520.0, 1330.0, 1040715.0, 2849.0, 647.0, 347.0, 236.0, 171.0, 138.0, 108.0, 77.0, 69.0, 35.0, 37.0, 12.0, 11.0, 15.0, 3.0, 1.0, 1.0, 7.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0253143310546875, -0.024603843688964844, -0.023893356323242188, -0.02318286895751953, -0.022472381591796875, -0.02176189422607422, -0.021051406860351562, -0.020340919494628906, -0.01963043212890625, -0.018919944763183594, -0.018209457397460938, -0.01749897003173828, -0.016788482666015625, -0.01607799530029297, -0.015367507934570312, -0.014657020568847656, -0.013946533203125, -0.013236045837402344, -0.012525558471679688, -0.011815071105957031, -0.011104583740234375, -0.010394096374511719, -0.009683609008789062, -0.008973121643066406, -0.00826263427734375, -0.007552146911621094, -0.0068416595458984375, -0.006131172180175781, -0.005420684814453125, -0.004710197448730469, -0.0039997100830078125, -0.0032892227172851562, -0.0025787353515625, -0.0018682479858398438, -0.0011577606201171875, -0.00044727325439453125, 0.000263214111328125, 0.0009737014770507812, 0.0016841888427734375, 0.0023946762084960938, 0.00310516357421875, 0.0038156509399414062, 0.0045261383056640625, 0.005236625671386719, 0.005947113037109375, 0.006657600402832031, 0.0073680877685546875, 0.008078575134277344, 0.0087890625, 0.009499549865722656, 0.010210037231445312, 0.010920524597167969, 0.011631011962890625, 0.012341499328613281, 0.013051986694335938, 0.013762474060058594, 0.01447296142578125, 0.015183448791503906, 0.015893936157226562, 0.01660442352294922, 0.017314910888671875, 0.01802539825439453, 0.018735885620117188, 0.019446372985839844, 0.0201568603515625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 822.0, 191.0, 1.0, 0.0, 1.0], "bins": [-0.0092241782695055, -0.009069911204278469, -0.008915645070374012, -0.00876137800514698, -0.008607110939919949, -0.008452844806015491, -0.00829857774078846, -0.008144311606884003, -0.007990044541656971, -0.00783577747642994, -0.007681510876864195, -0.0075272442772984505, -0.007372977677732706, -0.007218711078166962, -0.00706444401293993, -0.0069101774133741856, -0.006755910813808441, -0.006601644214242697, -0.006447377149015665, -0.006293110549449921, -0.006138843949884176, -0.005984577350318432, -0.0058303102850914, -0.005676043685525656, -0.005521776620298624, -0.00536751002073288, -0.005213242955505848, -0.0050589763559401035, -0.004904709756374359, -0.004750443156808615, -0.004596176091581583, -0.004441909492015839, -0.004287642426788807, -0.0041333758272230625, -0.003979108761996031, -0.0038248421624302864, -0.003670575562864542, -0.003516308730468154, -0.003362041898071766, -0.0032077752985060215, -0.003053508698940277, -0.002899241866543889, -0.0027449752669781446, -0.0025907084345817566, -0.002436441835016012, -0.002282175002619624, -0.002127908170223236, -0.0019736415706574917, -0.0018193749710917473, -0.001665108255110681, -0.0015108415391296148, -0.0013565747067332268, -0.0012023081071674824, -0.0010480412747710943, -0.0008937745587900281, -0.0007395078428089619, -0.0005852410686202347, -0.0004309743526391685, -0.0002767076075542718, -0.00012244086246937513, 3.1825853511691093e-05, 0.00018609256949275732, 0.00034035934368148446, 0.0004946260596625507, 0.0006488927756436169]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 6.0, 10.0, 9.0, 11.0, 19.0, 18.0, 22.0, 21.0, 30.0, 24.0, 18.0, 34.0, 26.0, 48.0, 24.0, 36.0, 39.0, 38.0, 39.0, 44.0, 45.0, 45.0, 35.0, 25.0, 39.0, 39.0, 20.0, 38.0, 35.0, 25.0, 22.0, 15.0, 15.0, 17.0, 13.0, 13.0, 6.0, 11.0, 5.0, 7.0, 3.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0004888176918029785, -0.0004729153588414192, -0.0004570130258798599, -0.00044111069291830063, -0.00042520835995674133, -0.00040930602699518204, -0.00039340369403362274, -0.00037750136107206345, -0.00036159902811050415, -0.00034569669514894485, -0.00032979436218738556, -0.00031389202922582626, -0.00029798969626426697, -0.00028208736330270767, -0.0002661850303411484, -0.0002502826973795891, -0.00023438036441802979, -0.0002184780314564705, -0.0002025756984949112, -0.0001866733655333519, -0.0001707710325717926, -0.0001548686996102333, -0.000138966366648674, -0.00012306403368711472, -0.00010716170072555542, -9.125936776399612e-05, -7.535703480243683e-05, -5.945470184087753e-05, -4.355236887931824e-05, -2.765003591775894e-05, -1.1747702956199646e-05, 4.15463000535965e-06, 2.0056962966918945e-05, 3.595929592847824e-05, 5.186162889003754e-05, 6.776396185159683e-05, 8.366629481315613e-05, 9.956862777471542e-05, 0.00011547096073627472, 0.00013137329369783401, 0.0001472756266593933, 0.0001631779596209526, 0.0001790802925825119, 0.0001949826255440712, 0.0002108849585056305, 0.0002267872914671898, 0.00024268962442874908, 0.0002585919573903084, 0.0002744942903518677, 0.00029039662331342697, 0.00030629895627498627, 0.00032220128923654556, 0.00033810362219810486, 0.00035400595515966415, 0.00036990828812122345, 0.00038581062108278275, 0.00040171295404434204, 0.00041761528700590134, 0.00043351761996746063, 0.00044941995292901993, 0.0004653222858905792, 0.0004812246188521385, 0.0004971269518136978, 0.0005130292847752571, 0.0005289316177368164]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 4.0, 7.0, 12.0, 7.0, 3.0, 13.0, 9.0, 21.0, 20.0, 17.0, 28.0, 23.0, 29.0, 24.0, 34.0, 30.0, 35.0, 33.0, 39.0, 46.0, 41.0, 43.0, 36.0, 46.0, 39.0, 32.0, 38.0, 42.0, 37.0, 23.0, 26.0, 22.0, 19.0, 25.0, 18.0, 17.0, 13.0, 9.0, 10.0, 9.0, 8.0, 5.0, 3.0, 1.0, 6.0, 3.0, 2.0, 2.0], "bins": [-3.94140625, -3.836181640625, -3.73095703125, -3.625732421875, -3.5205078125, -3.415283203125, -3.31005859375, -3.204833984375, -3.099609375, -2.994384765625, -2.88916015625, -2.783935546875, -2.6787109375, -2.573486328125, -2.46826171875, -2.363037109375, -2.2578125, -2.152587890625, -2.04736328125, -1.942138671875, -1.8369140625, -1.731689453125, -1.62646484375, -1.521240234375, -1.416015625, -1.310791015625, -1.20556640625, -1.100341796875, -0.9951171875, -0.889892578125, -0.78466796875, -0.679443359375, -0.57421875, -0.468994140625, -0.36376953125, -0.258544921875, -0.1533203125, -0.048095703125, 0.05712890625, 0.162353515625, 0.267578125, 0.372802734375, 0.47802734375, 0.583251953125, 0.6884765625, 0.793701171875, 0.89892578125, 1.004150390625, 1.109375, 1.214599609375, 1.31982421875, 1.425048828125, 1.5302734375, 1.635498046875, 1.74072265625, 1.845947265625, 1.951171875, 2.056396484375, 2.16162109375, 2.266845703125, 2.3720703125, 2.477294921875, 2.58251953125, 2.687744140625, 2.79296875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 1.0, 8.0, 11.0, 13.0, 20.0, 21.0, 29.0, 40.0, 71.0, 55.0, 89.0, 141.0, 191.0, 245.0, 326.0, 399.0, 600.0, 904.0, 1227.0, 1589.0, 2385.0, 3935.0, 6542.0, 12929.0, 37855.0, 608230.0, 314125.0, 28372.0, 11023.0, 5757.0, 3544.0, 2248.0, 1575.0, 1079.0, 789.0, 592.0, 407.0, 311.0, 230.0, 176.0, 124.0, 96.0, 66.0, 44.0, 38.0, 33.0, 18.0, 20.0, 13.0, 6.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-17.4375, -16.890869140625, -16.34423828125, -15.797607421875, -15.2509765625, -14.704345703125, -14.15771484375, -13.611083984375, -13.064453125, -12.517822265625, -11.97119140625, -11.424560546875, -10.8779296875, -10.331298828125, -9.78466796875, -9.238037109375, -8.69140625, -8.144775390625, -7.59814453125, -7.051513671875, -6.5048828125, -5.958251953125, -5.41162109375, -4.864990234375, -4.318359375, -3.771728515625, -3.22509765625, -2.678466796875, -2.1318359375, -1.585205078125, -1.03857421875, -0.491943359375, 0.0546875, 0.601318359375, 1.14794921875, 1.694580078125, 2.2412109375, 2.787841796875, 3.33447265625, 3.881103515625, 4.427734375, 4.974365234375, 5.52099609375, 6.067626953125, 6.6142578125, 7.160888671875, 7.70751953125, 8.254150390625, 8.80078125, 9.347412109375, 9.89404296875, 10.440673828125, 10.9873046875, 11.533935546875, 12.08056640625, 12.627197265625, 13.173828125, 13.720458984375, 14.26708984375, 14.813720703125, 15.3603515625, 15.906982421875, 16.45361328125, 17.000244140625, 17.546875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 8.0, 6.0, 4.0, 7.0, 5.0, 16.0, 10.0, 14.0, 19.0, 22.0, 22.0, 24.0, 33.0, 26.0, 23.0, 39.0, 37.0, 40.0, 44.0, 79.0, 223.0, 1620.0, 212.0, 99.0, 62.0, 42.0, 45.0, 21.0, 50.0, 24.0, 24.0, 34.0, 31.0, 19.0, 10.0, 18.0, 12.0, 7.0, 3.0, 5.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-9.890625, -9.555419921875, -9.22021484375, -8.885009765625, -8.5498046875, -8.214599609375, -7.87939453125, -7.544189453125, -7.208984375, -6.873779296875, -6.53857421875, -6.203369140625, -5.8681640625, -5.532958984375, -5.19775390625, -4.862548828125, -4.52734375, -4.192138671875, -3.85693359375, -3.521728515625, -3.1865234375, -2.851318359375, -2.51611328125, -2.180908203125, -1.845703125, -1.510498046875, -1.17529296875, -0.840087890625, -0.5048828125, -0.169677734375, 0.16552734375, 0.500732421875, 0.8359375, 1.171142578125, 1.50634765625, 1.841552734375, 2.1767578125, 2.511962890625, 2.84716796875, 3.182373046875, 3.517578125, 3.852783203125, 4.18798828125, 4.523193359375, 4.8583984375, 5.193603515625, 5.52880859375, 5.864013671875, 6.19921875, 6.534423828125, 6.86962890625, 7.204833984375, 7.5400390625, 7.875244140625, 8.21044921875, 8.545654296875, 8.880859375, 9.216064453125, 9.55126953125, 9.886474609375, 10.2216796875, 10.556884765625, 10.89208984375, 11.227294921875, 11.5625]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 2.0, 15.0, 11.0, 15.0, 25.0, 27.0, 20.0, 25.0, 30.0, 45.0, 46.0, 74.0, 105.0, 264.0, 936.0, 54167.0, 3086244.0, 2623.0, 465.0, 155.0, 80.0, 57.0, 45.0, 30.0, 25.0, 26.0, 26.0, 21.0, 18.0, 14.0, 13.0, 9.0, 8.0, 4.0, 7.0, 8.0, 7.0, 6.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-54.625, -53.0751953125, -51.525390625, -49.9755859375, -48.42578125, -46.8759765625, -45.326171875, -43.7763671875, -42.2265625, -40.6767578125, -39.126953125, -37.5771484375, -36.02734375, -34.4775390625, -32.927734375, -31.3779296875, -29.828125, -28.2783203125, -26.728515625, -25.1787109375, -23.62890625, -22.0791015625, -20.529296875, -18.9794921875, -17.4296875, -15.8798828125, -14.330078125, -12.7802734375, -11.23046875, -9.6806640625, -8.130859375, -6.5810546875, -5.03125, -3.4814453125, -1.931640625, -0.3818359375, 1.16796875, 2.7177734375, 4.267578125, 5.8173828125, 7.3671875, 8.9169921875, 10.466796875, 12.0166015625, 13.56640625, 15.1162109375, 16.666015625, 18.2158203125, 19.765625, 21.3154296875, 22.865234375, 24.4150390625, 25.96484375, 27.5146484375, 29.064453125, 30.6142578125, 32.1640625, 33.7138671875, 35.263671875, 36.8134765625, 38.36328125, 39.9130859375, 41.462890625, 43.0126953125, 44.5625]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 15.0, 85.0, 287.0, 390.0, 182.0, 40.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.37948989868164, -41.35315704345703, -40.326820373535156, -39.30048751831055, -38.27415084838867, -37.24781799316406, -36.22148132324219, -35.19514846801758, -34.16881561279297, -33.14248275756836, -32.116146087646484, -31.089811325073242, -30.0634765625, -29.03714370727539, -28.01080894470215, -26.984474182128906, -25.95813751220703, -24.93180274963379, -23.905467987060547, -22.879133224487305, -21.852798461914062, -20.826465606689453, -19.80013084411621, -18.77379608154297, -17.747461318969727, -16.721126556396484, -15.694791793823242, -14.668457984924316, -13.642123222351074, -12.615788459777832, -11.589454650878906, -10.563119888305664, -9.536781311035156, -8.510446548461914, -7.48411226272583, -6.457777976989746, -5.431443214416504, -4.405108451843262, -3.3787741661071777, -2.3524398803710938, -1.3261051177978516, -0.2997705936431885, 0.7265639305114746, 1.7528984546661377, 2.779232978820801, 3.805567741394043, 4.831902027130127, 5.858236312866211, 6.884571075439453, 7.910905838012695, 8.937240600585938, 9.963574409484863, 10.989909172058105, 12.016243934631348, 13.042577743530273, 14.068912506103516, 15.095247268676758, 16.12158203125, 17.147916793823242, 18.174251556396484, 19.200584411621094, 20.22692108154297, 21.253253936767578, 22.27958869934082, 23.305923461914062]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 5.0, 8.0, 6.0, 8.0, 6.0, 11.0, 14.0, 17.0, 15.0, 17.0, 25.0, 26.0, 36.0, 39.0, 33.0, 26.0, 32.0, 38.0, 41.0, 37.0, 31.0, 41.0, 44.0, 45.0, 44.0, 36.0, 37.0, 22.0, 39.0, 33.0, 32.0, 15.0, 21.0, 17.0, 13.0, 22.0, 11.0, 8.0, 12.0, 8.0, 10.0, 9.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-34.45158386230469, -33.41813278198242, -32.38468551635742, -31.351234436035156, -30.317785263061523, -29.28433609008789, -28.250885009765625, -27.217435836791992, -26.18398666381836, -25.150537490844727, -24.117088317871094, -23.083637237548828, -22.050188064575195, -21.016738891601562, -19.983287811279297, -18.949838638305664, -17.91638946533203, -16.8829402923584, -15.84949016571045, -14.8160400390625, -13.782590866088867, -12.749141693115234, -11.715691566467285, -10.682241439819336, -9.648792266845703, -8.61534309387207, -7.581892967224121, -6.54844331741333, -5.514993667602539, -4.481544017791748, -3.448094367980957, -2.414644718170166, -1.381195068359375, -0.347745418548584, 0.685704231262207, 1.719153881072998, 2.752603530883789, 3.78605318069458, 4.819502830505371, 5.852952480316162, 6.886402130126953, 7.919851779937744, 8.953301429748535, 9.986751556396484, 11.020200729370117, 12.05364990234375, 13.0871000289917, 14.120550155639648, 15.153999328613281, 16.187448501586914, 17.220897674560547, 18.254348754882812, 19.287797927856445, 20.321247100830078, 21.354698181152344, 22.388147354125977, 23.42159652709961, 24.455045700073242, 25.488494873046875, 26.52194595336914, 27.555395126342773, 28.588844299316406, 29.622295379638672, 30.655744552612305, 31.689193725585938]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 10.0, 10.0, 5.0, 10.0, 11.0, 17.0, 10.0, 15.0, 15.0, 20.0, 27.0, 25.0, 32.0, 26.0, 39.0, 36.0, 26.0, 32.0, 44.0, 44.0, 42.0, 42.0, 43.0, 31.0, 34.0, 45.0, 30.0, 40.0, 40.0, 29.0, 14.0, 18.0, 24.0, 15.0, 24.0, 19.0, 11.0, 8.0, 11.0, 11.0, 3.0, 5.0, 0.0, 7.0, 4.0, 0.0, 2.0, 1.0, 3.0], "bins": [-4.0, -3.88897705078125, -3.7779541015625, -3.66693115234375, -3.555908203125, -3.44488525390625, -3.3338623046875, -3.22283935546875, -3.11181640625, -3.00079345703125, -2.8897705078125, -2.77874755859375, -2.667724609375, -2.55670166015625, -2.4456787109375, -2.33465576171875, -2.2236328125, -2.11260986328125, -2.0015869140625, -1.89056396484375, -1.779541015625, -1.66851806640625, -1.5574951171875, -1.44647216796875, -1.33544921875, -1.22442626953125, -1.1134033203125, -1.00238037109375, -0.891357421875, -0.78033447265625, -0.6693115234375, -0.55828857421875, -0.447265625, -0.33624267578125, -0.2252197265625, -0.11419677734375, -0.003173828125, 0.10784912109375, 0.2188720703125, 0.32989501953125, 0.44091796875, 0.55194091796875, 0.6629638671875, 0.77398681640625, 0.885009765625, 0.99603271484375, 1.1070556640625, 1.21807861328125, 1.3291015625, 1.44012451171875, 1.5511474609375, 1.66217041015625, 1.773193359375, 1.88421630859375, 1.9952392578125, 2.10626220703125, 2.21728515625, 2.32830810546875, 2.4393310546875, 2.55035400390625, 2.661376953125, 2.77239990234375, 2.8834228515625, 2.99444580078125, 3.10546875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 7.0, 2.0, 10.0, 10.0, 12.0, 9.0, 10.0, 14.0, 34.0, 39.0, 61.0, 68.0, 112.0, 144.0, 195.0, 321.0, 518.0, 906.0, 1546.0, 2938.0, 5949.0, 13642.0, 43580.0, 397314.0, 3258634.0, 397955.0, 44037.0, 13884.0, 5842.0, 2747.0, 1472.0, 806.0, 482.0, 310.0, 159.0, 151.0, 109.0, 78.0, 32.0, 43.0, 31.0, 26.0, 8.0, 10.0, 8.0, 5.0, 4.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-17.828125, -17.279541015625, -16.73095703125, -16.182373046875, -15.6337890625, -15.085205078125, -14.53662109375, -13.988037109375, -13.439453125, -12.890869140625, -12.34228515625, -11.793701171875, -11.2451171875, -10.696533203125, -10.14794921875, -9.599365234375, -9.05078125, -8.502197265625, -7.95361328125, -7.405029296875, -6.8564453125, -6.307861328125, -5.75927734375, -5.210693359375, -4.662109375, -4.113525390625, -3.56494140625, -3.016357421875, -2.4677734375, -1.919189453125, -1.37060546875, -0.822021484375, -0.2734375, 0.275146484375, 0.82373046875, 1.372314453125, 1.9208984375, 2.469482421875, 3.01806640625, 3.566650390625, 4.115234375, 4.663818359375, 5.21240234375, 5.760986328125, 6.3095703125, 6.858154296875, 7.40673828125, 7.955322265625, 8.50390625, 9.052490234375, 9.60107421875, 10.149658203125, 10.6982421875, 11.246826171875, 11.79541015625, 12.343994140625, 12.892578125, 13.441162109375, 13.98974609375, 14.538330078125, 15.0869140625, 15.635498046875, 16.18408203125, 16.732666015625, 17.28125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 14.0, 22.0, 54.0, 104.0, 226.0, 484.0, 996.0, 1128.0, 581.0, 266.0, 106.0, 60.0, 21.0, 15.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.875, -42.753662109375, -41.63232421875, -40.510986328125, -39.3896484375, -38.268310546875, -37.14697265625, -36.025634765625, -34.904296875, -33.782958984375, -32.66162109375, -31.540283203125, -30.4189453125, -29.297607421875, -28.17626953125, -27.054931640625, -25.93359375, -24.812255859375, -23.69091796875, -22.569580078125, -21.4482421875, -20.326904296875, -19.20556640625, -18.084228515625, -16.962890625, -15.841552734375, -14.72021484375, -13.598876953125, -12.4775390625, -11.356201171875, -10.23486328125, -9.113525390625, -7.9921875, -6.870849609375, -5.74951171875, -4.628173828125, -3.5068359375, -2.385498046875, -1.26416015625, -0.142822265625, 0.978515625, 2.099853515625, 3.22119140625, 4.342529296875, 5.4638671875, 6.585205078125, 7.70654296875, 8.827880859375, 9.94921875, 11.070556640625, 12.19189453125, 13.313232421875, 14.4345703125, 15.555908203125, 16.67724609375, 17.798583984375, 18.919921875, 20.041259765625, 21.16259765625, 22.283935546875, 23.4052734375, 24.526611328125, 25.64794921875, 26.769287109375, 27.890625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 3.0, 14.0, 22.0, 35.0, 52.0, 145.0, 357.0, 1841.0, 4157210.0, 33490.0, 675.0, 233.0, 90.0, 64.0, 29.0, 15.0, 10.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.71875, -51.34423828125, -46.9697265625, -42.59521484375, -38.220703125, -33.84619140625, -29.4716796875, -25.09716796875, -20.72265625, -16.34814453125, -11.9736328125, -7.59912109375, -3.224609375, 1.14990234375, 5.5244140625, 9.89892578125, 14.2734375, 18.64794921875, 23.0224609375, 27.39697265625, 31.771484375, 36.14599609375, 40.5205078125, 44.89501953125, 49.26953125, 53.64404296875, 58.0185546875, 62.39306640625, 66.767578125, 71.14208984375, 75.5166015625, 79.89111328125, 84.265625, 88.64013671875, 93.0146484375, 97.38916015625, 101.763671875, 106.13818359375, 110.5126953125, 114.88720703125, 119.26171875, 123.63623046875, 128.0107421875, 132.38525390625, 136.759765625, 141.13427734375, 145.5087890625, 149.88330078125, 154.2578125, 158.63232421875, 163.0068359375, 167.38134765625, 171.755859375, 176.13037109375, 180.5048828125, 184.87939453125, 189.25390625, 193.62841796875, 198.0029296875, 202.37744140625, 206.751953125, 211.12646484375, 215.5009765625, 219.87548828125, 224.25]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 7.0, 29.0, 138.0, 351.0, 320.0, 149.0, 15.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.679214477539062, -19.748876571655273, -15.818538665771484, -11.888201713562012, -7.957863807678223, -4.02752685546875, -0.09718894958496094, 3.833148956298828, 7.763486862182617, 11.693824768066406, 15.624162673950195, 19.554500579833984, 23.48483657836914, 27.41517448425293, 31.34551239013672, 35.275848388671875, 39.2061882019043, 43.13652420043945, 47.066864013671875, 50.99720001220703, 54.92753982543945, 58.85787582397461, 62.78821563720703, 66.71855163574219, 70.64888763427734, 74.5792236328125, 78.50955963134766, 82.43990325927734, 86.3702392578125, 90.30057525634766, 94.23091125488281, 98.1612548828125, 102.09159088134766, 106.02192687988281, 109.95226287841797, 113.88260650634766, 117.81294250488281, 121.74327850341797, 125.67361450195312, 129.6039581298828, 133.53428649902344, 137.46463012695312, 141.39495849609375, 145.32530212402344, 149.25563049316406, 153.18597412109375, 157.11631774902344, 161.04664611816406, 164.97698974609375, 168.90733337402344, 172.83766174316406, 176.76800537109375, 180.69833374023438, 184.62867736816406, 188.55902099609375, 192.48934936523438, 196.41969299316406, 200.35003662109375, 204.28036499023438, 208.21070861816406, 212.1410369873047, 216.07138061523438, 220.00172424316406, 223.9320526123047, 227.86239624023438]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 2.0, 6.0, 8.0, 7.0, 14.0, 12.0, 9.0, 19.0, 12.0, 21.0, 16.0, 33.0, 29.0, 26.0, 40.0, 35.0, 44.0, 46.0, 46.0, 41.0, 35.0, 38.0, 47.0, 45.0, 47.0, 38.0, 31.0, 32.0, 29.0, 27.0, 30.0, 29.0, 14.0, 17.0, 12.0, 14.0, 11.0, 8.0, 12.0, 6.0, 4.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-47.29497528076172, -45.63574981689453, -43.976524353027344, -42.31729507446289, -40.6580696105957, -38.998844146728516, -37.33961486816406, -35.680389404296875, -34.02116394042969, -32.3619384765625, -30.70271110534668, -29.04348373413086, -27.384258270263672, -25.725032806396484, -24.065805435180664, -22.406578063964844, -20.747352600097656, -19.08812713623047, -17.42889976501465, -15.769673347473145, -14.11044692993164, -12.451220512390137, -10.791994094848633, -9.132767677307129, -7.473541259765625, -5.814314842224121, -4.155088424682617, -2.4958620071411133, -0.8366355895996094, 0.8225908279418945, 2.4818172454833984, 4.141043663024902, 5.800270080566406, 7.45949649810791, 9.118722915649414, 10.777949333190918, 12.437175750732422, 14.096402168273926, 15.75562858581543, 17.41485595703125, 19.074081420898438, 20.733306884765625, 22.392534255981445, 24.051761627197266, 25.710987091064453, 27.37021255493164, 29.02943992614746, 30.68866729736328, 32.34789276123047, 34.007118225097656, 35.666343688964844, 37.3255729675293, 38.984798431396484, 40.64402389526367, 42.303253173828125, 43.96247863769531, 45.6217041015625, 47.28092956542969, 48.940155029296875, 50.59938430786133, 52.258609771728516, 53.9178352355957, 55.577064514160156, 57.236289978027344, 58.89551544189453]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 7.0, 5.0, 4.0, 11.0, 6.0, 9.0, 13.0, 17.0, 17.0, 17.0, 30.0, 24.0, 29.0, 26.0, 41.0, 27.0, 33.0, 28.0, 43.0, 43.0, 49.0, 46.0, 36.0, 45.0, 29.0, 26.0, 29.0, 42.0, 36.0, 23.0, 27.0, 20.0, 25.0, 22.0, 25.0, 15.0, 15.0, 7.0, 17.0, 9.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 5.0, 4.0, 0.0, 0.0, 1.0], "bins": [-3.919921875, -3.80633544921875, -3.6927490234375, -3.57916259765625, -3.465576171875, -3.35198974609375, -3.2384033203125, -3.12481689453125, -3.01123046875, -2.89764404296875, -2.7840576171875, -2.67047119140625, -2.556884765625, -2.44329833984375, -2.3297119140625, -2.21612548828125, -2.1025390625, -1.98895263671875, -1.8753662109375, -1.76177978515625, -1.648193359375, -1.53460693359375, -1.4210205078125, -1.30743408203125, -1.19384765625, -1.08026123046875, -0.9666748046875, -0.85308837890625, -0.739501953125, -0.62591552734375, -0.5123291015625, -0.39874267578125, -0.28515625, -0.17156982421875, -0.0579833984375, 0.05560302734375, 0.169189453125, 0.28277587890625, 0.3963623046875, 0.50994873046875, 0.62353515625, 0.73712158203125, 0.8507080078125, 0.96429443359375, 1.077880859375, 1.19146728515625, 1.3050537109375, 1.41864013671875, 1.5322265625, 1.64581298828125, 1.7593994140625, 1.87298583984375, 1.986572265625, 2.10015869140625, 2.2137451171875, 2.32733154296875, 2.44091796875, 2.55450439453125, 2.6680908203125, 2.78167724609375, 2.895263671875, 3.00885009765625, 3.1224365234375, 3.23602294921875, 3.349609375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 8.0, 17.0, 16.0, 17.0, 41.0, 43.0, 68.0, 113.0, 181.0, 223.0, 320.0, 415.0, 607.0, 857.0, 1262.0, 1854.0, 2436.0, 3396.0, 4748.0, 6573.0, 9148.0, 12780.0, 18185.0, 26222.0, 38659.0, 58944.0, 91166.0, 137968.0, 176782.0, 150075.0, 100783.0, 64939.0, 42999.0, 28773.0, 19383.0, 13653.0, 9730.0, 6973.0, 5157.0, 3705.0, 2691.0, 1920.0, 1414.0, 1064.0, 729.0, 447.0, 354.0, 242.0, 164.0, 100.0, 73.0, 54.0, 38.0, 25.0, 15.0, 9.0, 3.0, 0.0, 5.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.3486328125, -0.33686065673828125, -0.3250885009765625, -0.31331634521484375, -0.301544189453125, -0.28977203369140625, -0.2779998779296875, -0.26622772216796875, -0.25445556640625, -0.24268341064453125, -0.2309112548828125, -0.21913909912109375, -0.207366943359375, -0.19559478759765625, -0.1838226318359375, -0.17205047607421875, -0.1602783203125, -0.14850616455078125, -0.1367340087890625, -0.12496185302734375, -0.113189697265625, -0.10141754150390625, -0.0896453857421875, -0.07787322998046875, -0.06610107421875, -0.05432891845703125, -0.0425567626953125, -0.03078460693359375, -0.019012451171875, -0.00724029541015625, 0.0045318603515625, 0.01630401611328125, 0.028076171875, 0.03984832763671875, 0.0516204833984375, 0.06339263916015625, 0.075164794921875, 0.08693695068359375, 0.0987091064453125, 0.11048126220703125, 0.12225341796875, 0.13402557373046875, 0.1457977294921875, 0.15756988525390625, 0.169342041015625, 0.18111419677734375, 0.1928863525390625, 0.20465850830078125, 0.2164306640625, 0.22820281982421875, 0.2399749755859375, 0.25174713134765625, 0.263519287109375, 0.27529144287109375, 0.2870635986328125, 0.29883575439453125, 0.31060791015625, 0.32238006591796875, 0.3341522216796875, 0.34592437744140625, 0.357696533203125, 0.36946868896484375, 0.3812408447265625, 0.39301300048828125, 0.40478515625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 4.0, 5.0, 6.0, 10.0, 12.0, 13.0, 16.0, 13.0, 19.0, 24.0, 31.0, 28.0, 29.0, 32.0, 43.0, 36.0, 49.0, 46.0, 40.0, 1066.0, 39.0, 47.0, 44.0, 39.0, 19.0, 37.0, 32.0, 37.0, 36.0, 31.0, 28.0, 24.0, 16.0, 12.0, 10.0, 12.0, 6.0, 10.0, 5.0, 7.0, 4.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.3671875, -2.2882080078125, -2.209228515625, -2.1302490234375, -2.05126953125, -1.9722900390625, -1.893310546875, -1.8143310546875, -1.7353515625, -1.6563720703125, -1.577392578125, -1.4984130859375, -1.41943359375, -1.3404541015625, -1.261474609375, -1.1824951171875, -1.103515625, -1.0245361328125, -0.945556640625, -0.8665771484375, -0.78759765625, -0.7086181640625, -0.629638671875, -0.5506591796875, -0.4716796875, -0.3927001953125, -0.313720703125, -0.2347412109375, -0.15576171875, -0.0767822265625, 0.002197265625, 0.0811767578125, 0.16015625, 0.2391357421875, 0.318115234375, 0.3970947265625, 0.47607421875, 0.5550537109375, 0.634033203125, 0.7130126953125, 0.7919921875, 0.8709716796875, 0.949951171875, 1.0289306640625, 1.10791015625, 1.1868896484375, 1.265869140625, 1.3448486328125, 1.423828125, 1.5028076171875, 1.581787109375, 1.6607666015625, 1.73974609375, 1.8187255859375, 1.897705078125, 1.9766845703125, 2.0556640625, 2.1346435546875, 2.213623046875, 2.2926025390625, 2.37158203125, 2.4505615234375, 2.529541015625, 2.6085205078125, 2.6875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 6.0, 1.0, 6.0, 3.0, 11.0, 6.0, 16.0, 16.0, 28.0, 49.0, 75.0, 102.0, 150.0, 198.0, 341.0, 509.0, 775.0, 1254.0, 1757.0, 2771.0, 4173.0, 6374.0, 10443.0, 16217.0, 26941.0, 45517.0, 79552.0, 138151.0, 1252265.0, 201938.0, 126859.0, 72483.0, 41738.0, 24469.0, 15015.0, 9401.0, 5939.0, 3937.0, 2546.0, 1701.0, 1171.0, 755.0, 492.0, 310.0, 229.0, 146.0, 90.0, 71.0, 46.0, 32.0, 18.0, 19.0, 14.0, 7.0, 2.0, 6.0, 1.0, 1.0, 3.0], "bins": [-0.44921875, -0.43597412109375, -0.4227294921875, -0.40948486328125, -0.396240234375, -0.38299560546875, -0.3697509765625, -0.35650634765625, -0.34326171875, -0.33001708984375, -0.3167724609375, -0.30352783203125, -0.290283203125, -0.27703857421875, -0.2637939453125, -0.25054931640625, -0.2373046875, -0.22406005859375, -0.2108154296875, -0.19757080078125, -0.184326171875, -0.17108154296875, -0.1578369140625, -0.14459228515625, -0.13134765625, -0.11810302734375, -0.1048583984375, -0.09161376953125, -0.078369140625, -0.06512451171875, -0.0518798828125, -0.03863525390625, -0.025390625, -0.01214599609375, 0.0010986328125, 0.01434326171875, 0.027587890625, 0.04083251953125, 0.0540771484375, 0.06732177734375, 0.08056640625, 0.09381103515625, 0.1070556640625, 0.12030029296875, 0.133544921875, 0.14678955078125, 0.1600341796875, 0.17327880859375, 0.1865234375, 0.19976806640625, 0.2130126953125, 0.22625732421875, 0.239501953125, 0.25274658203125, 0.2659912109375, 0.27923583984375, 0.29248046875, 0.30572509765625, 0.3189697265625, 0.33221435546875, 0.345458984375, 0.35870361328125, 0.3719482421875, 0.38519287109375, 0.3984375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 2.0, 2.0, 3.0, 8.0, 7.0, 7.0, 6.0, 12.0, 17.0, 23.0, 23.0, 32.0, 25.0, 40.0, 55.0, 55.0, 62.0, 47.0, 68.0, 33.0, 64.0, 52.0, 54.0, 54.0, 45.0, 32.0, 48.0, 27.0, 18.0, 23.0, 16.0, 10.0, 7.0, 7.0, 8.0, 3.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00133514404296875, -0.0012962818145751953, -0.0012574195861816406, -0.001218557357788086, -0.0011796951293945312, -0.0011408329010009766, -0.0011019706726074219, -0.0010631084442138672, -0.0010242462158203125, -0.0009853839874267578, -0.0009465217590332031, -0.0009076595306396484, -0.0008687973022460938, -0.0008299350738525391, -0.0007910728454589844, -0.0007522106170654297, -0.000713348388671875, -0.0006744861602783203, -0.0006356239318847656, -0.0005967617034912109, -0.0005578994750976562, -0.0005190372467041016, -0.0004801750183105469, -0.0004413127899169922, -0.0004024505615234375, -0.0003635883331298828, -0.0003247261047363281, -0.00028586387634277344, -0.00024700164794921875, -0.00020813941955566406, -0.00016927719116210938, -0.0001304149627685547, -9.1552734375e-05, -5.269050598144531e-05, -1.3828277587890625e-05, 2.5033950805664062e-05, 6.389617919921875e-05, 0.00010275840759277344, 0.00014162063598632812, 0.0001804828643798828, 0.0002193450927734375, 0.0002582073211669922, 0.0002970695495605469, 0.00033593177795410156, 0.00037479400634765625, 0.00041365623474121094, 0.0004525184631347656, 0.0004913806915283203, 0.000530242919921875, 0.0005691051483154297, 0.0006079673767089844, 0.0006468296051025391, 0.0006856918334960938, 0.0007245540618896484, 0.0007634162902832031, 0.0008022785186767578, 0.0008411407470703125, 0.0008800029754638672, 0.0009188652038574219, 0.0009577274322509766, 0.0009965896606445312, 0.001035451889038086, 0.0010743141174316406, 0.0011131763458251953, 0.00115203857421875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 2.0, 12.0, 8.0, 9.0, 9.0, 18.0, 29.0, 33.0, 53.0, 51.0, 88.0, 122.0, 188.0, 307.0, 768.0, 339127.0, 705930.0, 805.0, 327.0, 229.0, 114.0, 102.0, 48.0, 39.0, 28.0, 28.0, 18.0, 13.0, 9.0, 4.0, 8.0, 8.0, 7.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0318603515625, -0.03086566925048828, -0.029870986938476562, -0.028876304626464844, -0.027881622314453125, -0.026886940002441406, -0.025892257690429688, -0.02489757537841797, -0.02390289306640625, -0.02290821075439453, -0.021913528442382812, -0.020918846130371094, -0.019924163818359375, -0.018929481506347656, -0.017934799194335938, -0.01694011688232422, -0.0159454345703125, -0.014950752258300781, -0.013956069946289062, -0.012961387634277344, -0.011966705322265625, -0.010972023010253906, -0.009977340698242188, -0.008982658386230469, -0.00798797607421875, -0.006993293762207031, -0.0059986114501953125, -0.005003929138183594, -0.004009246826171875, -0.0030145645141601562, -0.0020198822021484375, -0.0010251998901367188, -3.0517578125e-05, 0.0009641647338867188, 0.0019588470458984375, 0.0029535293579101562, 0.003948211669921875, 0.004942893981933594, 0.0059375762939453125, 0.006932258605957031, 0.00792694091796875, 0.008921623229980469, 0.009916305541992188, 0.010910987854003906, 0.011905670166015625, 0.012900352478027344, 0.013895034790039062, 0.014889717102050781, 0.0158843994140625, 0.01687908172607422, 0.017873764038085938, 0.018868446350097656, 0.019863128662109375, 0.020857810974121094, 0.021852493286132812, 0.02284717559814453, 0.02384185791015625, 0.02483654022216797, 0.025831222534179688, 0.026825904846191406, 0.027820587158203125, 0.028815269470214844, 0.029809951782226562, 0.03080463409423828, 0.03179931640625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 9.0, 894.0, 117.0], "bins": [-0.011344287544488907, -0.011163369752466679, -0.01098245196044445, -0.010801534168422222, -0.010620616376399994, -0.01043969951570034, -0.010258780792355537, -0.010077863931655884, -0.009896946139633656, -0.009716028347611427, -0.009535110555589199, -0.00935419276356697, -0.009173274971544743, -0.008992357179522514, -0.00881144031882286, -0.008630522526800632, -0.008449604734778404, -0.008268686942756176, -0.008087769150733948, -0.00790685135871172, -0.007725934032350779, -0.00754501624032855, -0.007364098448306322, -0.007183180656284094, -0.007002262398600578, -0.00682134460657835, -0.006640426814556122, -0.006459509022533894, -0.006278591696172953, -0.006097673904150724, -0.005916756112128496, -0.005735838320106268, -0.005554920993745327, -0.005374003201723099, -0.0051930854097008705, -0.005012167617678642, -0.004831250291317701, -0.004650332499295473, -0.004469414707273245, -0.004288496915251017, -0.004107579588890076, -0.0039266617968678474, -0.003745744237676263, -0.0035648264456540346, -0.00338390888646245, -0.003202991094440222, -0.0030220733024179935, -0.0028411555103957653, -0.002660237718373537, -0.002479319926351309, -0.0022984023671597242, -0.002117484575137496, -0.0019365668995305896, -0.0017556492239236832, -0.001574731431901455, -0.0013938137562945485, -0.001212896080687642, -0.0010319784050807357, -0.0008510606712661684, -0.000670142937451601, -0.0004892252618446946, -0.0003083075862377882, -0.00012738979421555996, 5.3527881391346455e-05, 0.00023444551334250718]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 7.0, 5.0, 15.0, 9.0, 15.0, 17.0, 21.0, 19.0, 30.0, 29.0, 32.0, 31.0, 38.0, 31.0, 42.0, 36.0, 36.0, 45.0, 41.0, 59.0, 44.0, 35.0, 36.0, 30.0, 35.0, 48.0, 21.0, 25.0, 32.0, 13.0, 20.0, 18.0, 23.0, 10.0, 10.0, 9.0, 10.0, 8.0, 4.0, 5.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0006972551345825195, -0.0006773583590984344, -0.0006574615836143494, -0.0006375648081302643, -0.0006176680326461792, -0.0005977712571620941, -0.000577874481678009, -0.000557977706193924, -0.0005380809307098389, -0.0005181841552257538, -0.0004982873797416687, -0.0004783906042575836, -0.00045849382877349854, -0.00043859705328941345, -0.00041870027780532837, -0.0003988035023212433, -0.0003789067268371582, -0.0003590099513530731, -0.00033911317586898804, -0.00031921640038490295, -0.00029931962490081787, -0.0002794228494167328, -0.0002595260739326477, -0.00023962929844856262, -0.00021973252296447754, -0.00019983574748039246, -0.00017993897199630737, -0.0001600421965122223, -0.0001401454210281372, -0.00012024864554405212, -0.00010035187005996704, -8.045509457588196e-05, -6.0558319091796875e-05, -4.066154360771179e-05, -2.076476812362671e-05, -8.67992639541626e-07, 1.9028782844543457e-05, 3.892555832862854e-05, 5.882233381271362e-05, 7.87191092967987e-05, 9.861588478088379e-05, 0.00011851266026496887, 0.00013840943574905396, 0.00015830621123313904, 0.00017820298671722412, 0.0001980997622013092, 0.0002179965376853943, 0.00023789331316947937, 0.00025779008865356445, 0.00027768686413764954, 0.0002975836396217346, 0.0003174804151058197, 0.0003373771905899048, 0.00035727396607398987, 0.00037717074155807495, 0.00039706751704216003, 0.0004169642925262451, 0.0004368610680103302, 0.0004567578434944153, 0.00047665461897850037, 0.0004965513944625854, 0.0005164481699466705, 0.0005363449454307556, 0.0005562417209148407, 0.0005761384963989258]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 7.0, 5.0, 4.0, 11.0, 6.0, 9.0, 13.0, 17.0, 17.0, 17.0, 30.0, 24.0, 29.0, 26.0, 41.0, 27.0, 33.0, 28.0, 43.0, 43.0, 49.0, 46.0, 36.0, 45.0, 29.0, 26.0, 29.0, 42.0, 36.0, 23.0, 27.0, 20.0, 25.0, 22.0, 25.0, 15.0, 15.0, 7.0, 17.0, 9.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 5.0, 4.0, 0.0, 0.0, 1.0], "bins": [-3.919921875, -3.80633544921875, -3.6927490234375, -3.57916259765625, -3.465576171875, -3.35198974609375, -3.2384033203125, -3.12481689453125, -3.01123046875, -2.89764404296875, -2.7840576171875, -2.67047119140625, -2.556884765625, -2.44329833984375, -2.3297119140625, -2.21612548828125, -2.1025390625, -1.98895263671875, -1.8753662109375, -1.76177978515625, -1.648193359375, -1.53460693359375, -1.4210205078125, -1.30743408203125, -1.19384765625, -1.08026123046875, -0.9666748046875, -0.85308837890625, -0.739501953125, -0.62591552734375, -0.5123291015625, -0.39874267578125, -0.28515625, -0.17156982421875, -0.0579833984375, 0.05560302734375, 0.169189453125, 0.28277587890625, 0.3963623046875, 0.50994873046875, 0.62353515625, 0.73712158203125, 0.8507080078125, 0.96429443359375, 1.077880859375, 1.19146728515625, 1.3050537109375, 1.41864013671875, 1.5322265625, 1.64581298828125, 1.7593994140625, 1.87298583984375, 1.986572265625, 2.10015869140625, 2.2137451171875, 2.32733154296875, 2.44091796875, 2.55450439453125, 2.6680908203125, 2.78167724609375, 2.895263671875, 3.00885009765625, 3.1224365234375, 3.23602294921875, 3.349609375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 3.0, 6.0, 17.0, 14.0, 8.0, 23.0, 34.0, 27.0, 49.0, 69.0, 75.0, 126.0, 189.0, 239.0, 334.0, 538.0, 942.0, 1646.0, 3571.0, 8568.0, 25482.0, 84687.0, 315972.0, 430284.0, 120356.0, 34334.0, 11543.0, 4372.0, 1975.0, 1097.0, 634.0, 400.0, 285.0, 155.0, 112.0, 106.0, 86.0, 44.0, 39.0, 29.0, 25.0, 27.0, 12.0, 9.0, 8.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.904296875, -3.786468505859375, -3.66864013671875, -3.550811767578125, -3.4329833984375, -3.315155029296875, -3.19732666015625, -3.079498291015625, -2.961669921875, -2.843841552734375, -2.72601318359375, -2.608184814453125, -2.4903564453125, -2.372528076171875, -2.25469970703125, -2.136871337890625, -2.01904296875, -1.901214599609375, -1.78338623046875, -1.665557861328125, -1.5477294921875, -1.429901123046875, -1.31207275390625, -1.194244384765625, -1.076416015625, -0.958587646484375, -0.84075927734375, -0.722930908203125, -0.6051025390625, -0.487274169921875, -0.36944580078125, -0.251617431640625, -0.1337890625, -0.015960693359375, 0.10186767578125, 0.219696044921875, 0.3375244140625, 0.455352783203125, 0.57318115234375, 0.691009521484375, 0.808837890625, 0.926666259765625, 1.04449462890625, 1.162322998046875, 1.2801513671875, 1.397979736328125, 1.51580810546875, 1.633636474609375, 1.75146484375, 1.869293212890625, 1.98712158203125, 2.104949951171875, 2.2227783203125, 2.340606689453125, 2.45843505859375, 2.576263427734375, 2.694091796875, 2.811920166015625, 2.92974853515625, 3.047576904296875, 3.1654052734375, 3.283233642578125, 3.40106201171875, 3.518890380859375, 3.63671875]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 14.0, 7.0, 7.0, 14.0, 18.0, 20.0, 17.0, 27.0, 27.0, 32.0, 46.0, 31.0, 51.0, 52.0, 45.0, 65.0, 405.0, 1623.0, 109.0, 62.0, 42.0, 46.0, 28.0, 35.0, 36.0, 27.0, 27.0, 18.0, 12.0, 22.0, 16.0, 16.0, 9.0, 11.0, 4.0, 5.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6015625, -13.150146484375, -12.69873046875, -12.247314453125, -11.7958984375, -11.344482421875, -10.89306640625, -10.441650390625, -9.990234375, -9.538818359375, -9.08740234375, -8.635986328125, -8.1845703125, -7.733154296875, -7.28173828125, -6.830322265625, -6.37890625, -5.927490234375, -5.47607421875, -5.024658203125, -4.5732421875, -4.121826171875, -3.67041015625, -3.218994140625, -2.767578125, -2.316162109375, -1.86474609375, -1.413330078125, -0.9619140625, -0.510498046875, -0.05908203125, 0.392333984375, 0.84375, 1.295166015625, 1.74658203125, 2.197998046875, 2.6494140625, 3.100830078125, 3.55224609375, 4.003662109375, 4.455078125, 4.906494140625, 5.35791015625, 5.809326171875, 6.2607421875, 6.712158203125, 7.16357421875, 7.614990234375, 8.06640625, 8.517822265625, 8.96923828125, 9.420654296875, 9.8720703125, 10.323486328125, 10.77490234375, 11.226318359375, 11.677734375, 12.129150390625, 12.58056640625, 13.031982421875, 13.4833984375, 13.934814453125, 14.38623046875, 14.837646484375, 15.2890625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 4.0, 4.0, 7.0, 6.0, 11.0, 18.0, 18.0, 15.0, 22.0, 16.0, 29.0, 32.0, 43.0, 56.0, 72.0, 103.0, 224.0, 545.0, 3076.0, 3079960.0, 59433.0, 1088.0, 343.0, 154.0, 106.0, 54.0, 47.0, 47.0, 32.0, 25.0, 20.0, 21.0, 15.0, 14.0, 7.0, 8.0, 11.0, 7.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-35.25, -34.205810546875, -33.16162109375, -32.117431640625, -31.0732421875, -30.029052734375, -28.98486328125, -27.940673828125, -26.896484375, -25.852294921875, -24.80810546875, -23.763916015625, -22.7197265625, -21.675537109375, -20.63134765625, -19.587158203125, -18.54296875, -17.498779296875, -16.45458984375, -15.410400390625, -14.3662109375, -13.322021484375, -12.27783203125, -11.233642578125, -10.189453125, -9.145263671875, -8.10107421875, -7.056884765625, -6.0126953125, -4.968505859375, -3.92431640625, -2.880126953125, -1.8359375, -0.791748046875, 0.25244140625, 1.296630859375, 2.3408203125, 3.385009765625, 4.42919921875, 5.473388671875, 6.517578125, 7.561767578125, 8.60595703125, 9.650146484375, 10.6943359375, 11.738525390625, 12.78271484375, 13.826904296875, 14.87109375, 15.915283203125, 16.95947265625, 18.003662109375, 19.0478515625, 20.092041015625, 21.13623046875, 22.180419921875, 23.224609375, 24.268798828125, 25.31298828125, 26.357177734375, 27.4013671875, 28.445556640625, 29.48974609375, 30.533935546875, 31.578125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [461.0, 557.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.451602935791016, -0.1377124786376953, 4.176177978515625, 8.490068435668945, 12.803958892822266, 17.117849349975586, 21.431739807128906, 25.745630264282227, 30.059520721435547, 34.3734130859375, 38.68730163574219, 43.001190185546875, 47.31508255004883, 51.62897491455078, 55.94286346435547, 60.256752014160156, 64.57064819335938, 68.88453674316406, 73.19842529296875, 77.51232147216797, 81.82621002197266, 86.14009857177734, 90.45399475097656, 94.76788330078125, 99.08177185058594, 103.39566040039062, 107.70954895019531, 112.02344512939453, 116.33733367919922, 120.6512222290039, 124.96511840820312, 129.2790069580078, 133.5928955078125, 137.9067840576172, 142.22067260742188, 146.53456115722656, 150.84844970703125, 155.162353515625, 159.4762420654297, 163.79013061523438, 168.10401916503906, 172.41790771484375, 176.73179626464844, 181.04568481445312, 185.35958862304688, 189.67347717285156, 193.98736572265625, 198.30125427246094, 202.61514282226562, 206.9290313720703, 211.242919921875, 215.5568084716797, 219.87069702148438, 224.18460083007812, 228.4984893798828, 232.8123779296875, 237.1262664794922, 241.44015502929688, 245.75404357910156, 250.06793212890625, 254.3818359375, 258.6957092285156, 263.0096130371094, 267.323486328125, 271.63739013671875]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 4.0, 4.0, 6.0, 6.0, 8.0, 5.0, 16.0, 8.0, 15.0, 23.0, 22.0, 17.0, 28.0, 36.0, 22.0, 22.0, 32.0, 37.0, 34.0, 31.0, 39.0, 32.0, 33.0, 38.0, 43.0, 33.0, 40.0, 41.0, 40.0, 30.0, 33.0, 28.0, 33.0, 23.0, 19.0, 19.0, 17.0, 15.0, 17.0, 13.0, 6.0, 6.0, 5.0, 7.0, 5.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-45.506263732910156, -44.218997955322266, -42.93173599243164, -41.64447021484375, -40.357208251953125, -39.069942474365234, -37.78268051147461, -36.49541473388672, -35.208152770996094, -33.9208869934082, -32.63362503051758, -31.34636116027832, -30.059097290039062, -28.771831512451172, -27.484567642211914, -26.197303771972656, -24.910037994384766, -23.622774124145508, -22.33551025390625, -21.048246383666992, -19.760982513427734, -18.473716735839844, -17.186452865600586, -15.899188995361328, -14.61192512512207, -13.324661254882812, -12.037397384643555, -10.75013256072998, -9.462868690490723, -8.175604820251465, -6.888340473175049, -5.601076126098633, -4.313812255859375, -3.026548147201538, -1.7392840385437012, -0.45201992988586426, 0.8352441787719727, 2.1225080490112305, 3.4097723960876465, 4.6970367431640625, 5.98430061340332, 7.271564483642578, 8.558828353881836, 9.84609317779541, 11.133357048034668, 12.420620918273926, 13.7078857421875, 14.995149612426758, 16.282413482666016, 17.569677352905273, 18.85694122314453, 20.14420509338379, 21.431468963623047, 22.718734741210938, 24.005998611450195, 25.293262481689453, 26.58052635192871, 27.86779022216797, 29.155054092407227, 30.442317962646484, 31.729583740234375, 33.016845703125, 34.30411148071289, 35.59137725830078, 36.878639221191406]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 10.0, 3.0, 6.0, 4.0, 9.0, 7.0, 7.0, 10.0, 18.0, 17.0, 18.0, 17.0, 26.0, 25.0, 34.0, 32.0, 32.0, 31.0, 25.0, 38.0, 38.0, 49.0, 53.0, 40.0, 38.0, 36.0, 33.0, 25.0, 37.0, 35.0, 35.0, 23.0, 24.0, 25.0, 18.0, 26.0, 24.0, 16.0, 9.0, 13.0, 8.0, 9.0, 8.0, 2.0, 7.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.98828125, -3.8714599609375, -3.754638671875, -3.6378173828125, -3.52099609375, -3.4041748046875, -3.287353515625, -3.1705322265625, -3.0537109375, -2.9368896484375, -2.820068359375, -2.7032470703125, -2.58642578125, -2.4696044921875, -2.352783203125, -2.2359619140625, -2.119140625, -2.0023193359375, -1.885498046875, -1.7686767578125, -1.65185546875, -1.5350341796875, -1.418212890625, -1.3013916015625, -1.1845703125, -1.0677490234375, -0.950927734375, -0.8341064453125, -0.71728515625, -0.6004638671875, -0.483642578125, -0.3668212890625, -0.25, -0.1331787109375, -0.016357421875, 0.1004638671875, 0.21728515625, 0.3341064453125, 0.450927734375, 0.5677490234375, 0.6845703125, 0.8013916015625, 0.918212890625, 1.0350341796875, 1.15185546875, 1.2686767578125, 1.385498046875, 1.5023193359375, 1.619140625, 1.7359619140625, 1.852783203125, 1.9696044921875, 2.08642578125, 2.2032470703125, 2.320068359375, 2.4368896484375, 2.5537109375, 2.6705322265625, 2.787353515625, 2.9041748046875, 3.02099609375, 3.1378173828125, 3.254638671875, 3.3714599609375, 3.48828125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 6.0, 5.0, 5.0, 15.0, 11.0, 15.0, 18.0, 20.0, 28.0, 36.0, 51.0, 58.0, 87.0, 126.0, 255.0, 434.0, 1386.0, 9695.0, 170818.0, 3037240.0, 936887.0, 32438.0, 3038.0, 701.0, 296.0, 174.0, 124.0, 80.0, 60.0, 28.0, 37.0, 24.0, 13.0, 19.0, 23.0, 8.0, 5.0, 7.0, 6.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.9375, -15.435302734375, -14.93310546875, -14.430908203125, -13.9287109375, -13.426513671875, -12.92431640625, -12.422119140625, -11.919921875, -11.417724609375, -10.91552734375, -10.413330078125, -9.9111328125, -9.408935546875, -8.90673828125, -8.404541015625, -7.90234375, -7.400146484375, -6.89794921875, -6.395751953125, -5.8935546875, -5.391357421875, -4.88916015625, -4.386962890625, -3.884765625, -3.382568359375, -2.88037109375, -2.378173828125, -1.8759765625, -1.373779296875, -0.87158203125, -0.369384765625, 0.1328125, 0.635009765625, 1.13720703125, 1.639404296875, 2.1416015625, 2.643798828125, 3.14599609375, 3.648193359375, 4.150390625, 4.652587890625, 5.15478515625, 5.656982421875, 6.1591796875, 6.661376953125, 7.16357421875, 7.665771484375, 8.16796875, 8.670166015625, 9.17236328125, 9.674560546875, 10.1767578125, 10.678955078125, 11.18115234375, 11.683349609375, 12.185546875, 12.687744140625, 13.18994140625, 13.692138671875, 14.1943359375, 14.696533203125, 15.19873046875, 15.700927734375, 16.203125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 13.0, 10.0, 23.0, 41.0, 41.0, 75.0, 124.0, 158.0, 234.0, 341.0, 455.0, 584.0, 513.0, 404.0, 357.0, 247.0, 148.0, 110.0, 55.0, 42.0, 32.0, 17.0, 19.0, 11.0, 5.0, 4.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.125, -18.6197509765625, -18.114501953125, -17.6092529296875, -17.10400390625, -16.5987548828125, -16.093505859375, -15.5882568359375, -15.0830078125, -14.5777587890625, -14.072509765625, -13.5672607421875, -13.06201171875, -12.5567626953125, -12.051513671875, -11.5462646484375, -11.041015625, -10.5357666015625, -10.030517578125, -9.5252685546875, -9.02001953125, -8.5147705078125, -8.009521484375, -7.5042724609375, -6.9990234375, -6.4937744140625, -5.988525390625, -5.4832763671875, -4.97802734375, -4.4727783203125, -3.967529296875, -3.4622802734375, -2.95703125, -2.4517822265625, -1.946533203125, -1.4412841796875, -0.93603515625, -0.4307861328125, 0.074462890625, 0.5797119140625, 1.0849609375, 1.5902099609375, 2.095458984375, 2.6007080078125, 3.10595703125, 3.6112060546875, 4.116455078125, 4.6217041015625, 5.126953125, 5.6322021484375, 6.137451171875, 6.6427001953125, 7.14794921875, 7.6531982421875, 8.158447265625, 8.6636962890625, 9.1689453125, 9.6741943359375, 10.179443359375, 10.6846923828125, 11.18994140625, 11.6951904296875, 12.200439453125, 12.7056884765625, 13.2109375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 10.0, 18.0, 17.0, 27.0, 29.0, 52.0, 82.0, 82.0, 142.0, 251.0, 553.0, 2006.0, 29550.0, 3273958.0, 875193.0, 10048.0, 1182.0, 440.0, 238.0, 111.0, 93.0, 51.0, 42.0, 28.0, 24.0, 11.0, 11.0, 4.0, 7.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.59375, -32.24169921875, -30.8896484375, -29.53759765625, -28.185546875, -26.83349609375, -25.4814453125, -24.12939453125, -22.77734375, -21.42529296875, -20.0732421875, -18.72119140625, -17.369140625, -16.01708984375, -14.6650390625, -13.31298828125, -11.9609375, -10.60888671875, -9.2568359375, -7.90478515625, -6.552734375, -5.20068359375, -3.8486328125, -2.49658203125, -1.14453125, 0.20751953125, 1.5595703125, 2.91162109375, 4.263671875, 5.61572265625, 6.9677734375, 8.31982421875, 9.671875, 11.02392578125, 12.3759765625, 13.72802734375, 15.080078125, 16.43212890625, 17.7841796875, 19.13623046875, 20.48828125, 21.84033203125, 23.1923828125, 24.54443359375, 25.896484375, 27.24853515625, 28.6005859375, 29.95263671875, 31.3046875, 32.65673828125, 34.0087890625, 35.36083984375, 36.712890625, 38.06494140625, 39.4169921875, 40.76904296875, 42.12109375, 43.47314453125, 44.8251953125, 46.17724609375, 47.529296875, 48.88134765625, 50.2333984375, 51.58544921875, 52.9375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 6.0, 21.0, 42.0, 63.0, 87.0, 152.0, 190.0, 174.0, 125.0, 74.0, 36.0, 27.0, 10.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.52871322631836, -24.427474975585938, -22.326236724853516, -20.224998474121094, -18.123760223388672, -16.02252197265625, -13.921281814575195, -11.820043563842773, -9.718805313110352, -7.61756706237793, -5.51632833480835, -3.4150896072387695, -1.3138513565063477, 0.7873868942260742, 2.8886260986328125, 4.989864349365234, 7.091102600097656, 9.192340850830078, 11.2935791015625, 13.394818305969238, 15.49605655670166, 17.597293853759766, 19.69853401184082, 21.799772262573242, 23.901010513305664, 26.002248764038086, 28.103487014770508, 30.204727172851562, 32.305965423583984, 34.407203674316406, 36.50844192504883, 38.60968017578125, 40.710914611816406, 42.81215286254883, 44.91339111328125, 47.01462936401367, 49.115867614746094, 51.217105865478516, 53.31834411621094, 55.419586181640625, 57.52082061767578, 59.6220588684082, 61.723297119140625, 63.82453536987305, 65.92577362060547, 68.02701568603516, 70.12825012207031, 72.2294921875, 74.33073425292969, 76.43197631835938, 78.53321075439453, 80.63445281982422, 82.73568725585938, 84.83692932128906, 86.93816375732422, 89.0394058227539, 91.14064025878906, 93.24188232421875, 95.3431167602539, 97.4443588256836, 99.54559326171875, 101.64683532714844, 103.7480697631836, 105.84931182861328, 107.95054626464844]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 2.0, 3.0, 3.0, 5.0, 8.0, 16.0, 15.0, 15.0, 7.0, 20.0, 27.0, 34.0, 29.0, 28.0, 19.0, 27.0, 32.0, 28.0, 38.0, 33.0, 42.0, 44.0, 46.0, 52.0, 37.0, 49.0, 41.0, 30.0, 26.0, 27.0, 29.0, 24.0, 20.0, 23.0, 19.0, 23.0, 11.0, 10.0, 13.0, 9.0, 9.0, 7.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-40.271270751953125, -39.05824279785156, -37.845211029052734, -36.63218307495117, -35.41915512084961, -34.20612335205078, -32.99309539794922, -31.780067443847656, -30.56703758239746, -29.354007720947266, -28.140979766845703, -26.927949905395508, -25.714920043945312, -24.50189208984375, -23.288862228393555, -22.07583236694336, -20.862804412841797, -19.6497745513916, -18.43674659729004, -17.223716735839844, -16.01068878173828, -14.797658920288086, -13.58462905883789, -12.371600151062012, -11.158571243286133, -9.945542335510254, -8.732513427734375, -7.51948356628418, -6.306454658508301, -5.093425750732422, -3.8803963661193848, -2.6673669815063477, -1.4543380737304688, -0.24130892753601074, 0.9717202186584473, 2.1847493648529053, 3.3977785110473633, 4.610807418823242, 5.823836803436279, 7.036866188049316, 8.249895095825195, 9.462924003601074, 10.675952911376953, 11.888982772827148, 13.102011680603027, 14.315040588378906, 15.528070449829102, 16.741100311279297, 17.95412826538086, 19.167158126831055, 20.380186080932617, 21.593215942382812, 22.806243896484375, 24.01927375793457, 25.232303619384766, 26.445331573486328, 27.658361434936523, 28.87139129638672, 30.08441925048828, 31.297449111938477, 32.51047897338867, 33.723506927490234, 34.9365348815918, 36.149566650390625, 37.36259460449219]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 7.0, 3.0, 9.0, 11.0, 8.0, 12.0, 16.0, 16.0, 24.0, 24.0, 26.0, 28.0, 25.0, 27.0, 38.0, 33.0, 42.0, 44.0, 40.0, 51.0, 53.0, 44.0, 38.0, 45.0, 33.0, 38.0, 38.0, 29.0, 24.0, 26.0, 24.0, 16.0, 21.0, 14.0, 16.0, 11.0, 8.0, 12.0, 8.0, 5.0, 3.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.515625, -4.38385009765625, -4.2520751953125, -4.12030029296875, -3.988525390625, -3.85675048828125, -3.7249755859375, -3.59320068359375, -3.46142578125, -3.32965087890625, -3.1978759765625, -3.06610107421875, -2.934326171875, -2.80255126953125, -2.6707763671875, -2.53900146484375, -2.4072265625, -2.27545166015625, -2.1436767578125, -2.01190185546875, -1.880126953125, -1.74835205078125, -1.6165771484375, -1.48480224609375, -1.35302734375, -1.22125244140625, -1.0894775390625, -0.95770263671875, -0.825927734375, -0.69415283203125, -0.5623779296875, -0.43060302734375, -0.298828125, -0.16705322265625, -0.0352783203125, 0.09649658203125, 0.228271484375, 0.36004638671875, 0.4918212890625, 0.62359619140625, 0.75537109375, 0.88714599609375, 1.0189208984375, 1.15069580078125, 1.282470703125, 1.41424560546875, 1.5460205078125, 1.67779541015625, 1.8095703125, 1.94134521484375, 2.0731201171875, 2.20489501953125, 2.336669921875, 2.46844482421875, 2.6002197265625, 2.73199462890625, 2.86376953125, 2.99554443359375, 3.1273193359375, 3.25909423828125, 3.390869140625, 3.52264404296875, 3.6544189453125, 3.78619384765625, 3.91796875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 16.0, 13.0, 21.0, 32.0, 54.0, 93.0, 124.0, 204.0, 344.0, 527.0, 872.0, 1428.0, 2367.0, 3856.0, 6271.0, 10275.0, 17187.0, 28747.0, 49874.0, 90726.0, 168604.0, 248968.0, 184113.0, 100444.0, 54498.0, 31408.0, 18814.0, 11160.0, 6929.0, 4105.0, 2505.0, 1498.0, 939.0, 567.0, 341.0, 243.0, 149.0, 88.0, 51.0, 30.0, 23.0, 18.0, 10.0, 6.0, 8.0, 8.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6123046875, -0.5940704345703125, -0.575836181640625, -0.5576019287109375, -0.53936767578125, -0.5211334228515625, -0.502899169921875, -0.4846649169921875, -0.4664306640625, -0.4481964111328125, -0.429962158203125, -0.4117279052734375, -0.39349365234375, -0.3752593994140625, -0.357025146484375, -0.3387908935546875, -0.320556640625, -0.3023223876953125, -0.284088134765625, -0.2658538818359375, -0.24761962890625, -0.2293853759765625, -0.211151123046875, -0.1929168701171875, -0.1746826171875, -0.1564483642578125, -0.138214111328125, -0.1199798583984375, -0.10174560546875, -0.0835113525390625, -0.065277099609375, -0.0470428466796875, -0.02880859375, -0.0105743408203125, 0.007659912109375, 0.0258941650390625, 0.04412841796875, 0.0623626708984375, 0.080596923828125, 0.0988311767578125, 0.1170654296875, 0.1352996826171875, 0.153533935546875, 0.1717681884765625, 0.19000244140625, 0.2082366943359375, 0.226470947265625, 0.2447052001953125, 0.262939453125, 0.2811737060546875, 0.299407958984375, 0.3176422119140625, 0.33587646484375, 0.3541107177734375, 0.372344970703125, 0.3905792236328125, 0.4088134765625, 0.4270477294921875, 0.445281982421875, 0.4635162353515625, 0.48175048828125, 0.4999847412109375, 0.518218994140625, 0.5364532470703125, 0.5546875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 7.0, 2.0, 6.0, 12.0, 17.0, 13.0, 9.0, 17.0, 17.0, 15.0, 27.0, 34.0, 28.0, 28.0, 41.0, 36.0, 41.0, 40.0, 39.0, 56.0, 1064.0, 46.0, 43.0, 51.0, 39.0, 42.0, 35.0, 34.0, 23.0, 26.0, 31.0, 21.0, 16.0, 14.0, 17.0, 10.0, 11.0, 9.0, 2.0, 1.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.818359375, -2.72821044921875, -2.6380615234375, -2.54791259765625, -2.457763671875, -2.36761474609375, -2.2774658203125, -2.18731689453125, -2.09716796875, -2.00701904296875, -1.9168701171875, -1.82672119140625, -1.736572265625, -1.64642333984375, -1.5562744140625, -1.46612548828125, -1.3759765625, -1.28582763671875, -1.1956787109375, -1.10552978515625, -1.015380859375, -0.92523193359375, -0.8350830078125, -0.74493408203125, -0.65478515625, -0.56463623046875, -0.4744873046875, -0.38433837890625, -0.294189453125, -0.20404052734375, -0.1138916015625, -0.02374267578125, 0.06640625, 0.15655517578125, 0.2467041015625, 0.33685302734375, 0.427001953125, 0.51715087890625, 0.6072998046875, 0.69744873046875, 0.78759765625, 0.87774658203125, 0.9678955078125, 1.05804443359375, 1.148193359375, 1.23834228515625, 1.3284912109375, 1.41864013671875, 1.5087890625, 1.59893798828125, 1.6890869140625, 1.77923583984375, 1.869384765625, 1.95953369140625, 2.0496826171875, 2.13983154296875, 2.22998046875, 2.32012939453125, 2.4102783203125, 2.50042724609375, 2.590576171875, 2.68072509765625, 2.7708740234375, 2.86102294921875, 2.951171875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 2.0, 4.0, 4.0, 17.0, 18.0, 28.0, 38.0, 84.0, 102.0, 151.0, 215.0, 379.0, 663.0, 955.0, 1595.0, 2639.0, 4529.0, 7365.0, 12734.0, 21918.0, 39480.0, 73793.0, 142443.0, 1286603.0, 224856.0, 125877.0, 66207.0, 35265.0, 20139.0, 11547.0, 6987.0, 4109.0, 2430.0, 1493.0, 914.0, 578.0, 356.0, 222.0, 124.0, 103.0, 62.0, 36.0, 19.0, 21.0, 8.0, 6.0, 8.0, 6.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5068359375, -0.48989105224609375, -0.4729461669921875, -0.45600128173828125, -0.439056396484375, -0.42211151123046875, -0.4051666259765625, -0.38822174072265625, -0.37127685546875, -0.35433197021484375, -0.3373870849609375, -0.32044219970703125, -0.303497314453125, -0.28655242919921875, -0.2696075439453125, -0.25266265869140625, -0.2357177734375, -0.21877288818359375, -0.2018280029296875, -0.18488311767578125, -0.167938232421875, -0.15099334716796875, -0.1340484619140625, -0.11710357666015625, -0.10015869140625, -0.08321380615234375, -0.0662689208984375, -0.04932403564453125, -0.032379150390625, -0.01543426513671875, 0.0015106201171875, 0.01845550537109375, 0.035400390625, 0.05234527587890625, 0.0692901611328125, 0.08623504638671875, 0.103179931640625, 0.12012481689453125, 0.1370697021484375, 0.15401458740234375, 0.17095947265625, 0.18790435791015625, 0.2048492431640625, 0.22179412841796875, 0.238739013671875, 0.25568389892578125, 0.2726287841796875, 0.28957366943359375, 0.3065185546875, 0.32346343994140625, 0.3404083251953125, 0.35735321044921875, 0.374298095703125, 0.39124298095703125, 0.4081878662109375, 0.42513275146484375, 0.44207763671875, 0.45902252197265625, 0.4759674072265625, 0.49291229248046875, 0.509857177734375, 0.5268020629882812, 0.5437469482421875, 0.5606918334960938, 0.57763671875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 7.0, 2.0, 5.0, 6.0, 9.0, 10.0, 13.0, 26.0, 22.0, 26.0, 26.0, 32.0, 47.0, 69.0, 60.0, 67.0, 69.0, 70.0, 71.0, 62.0, 50.0, 50.0, 41.0, 41.0, 22.0, 26.0, 16.0, 12.0, 12.0, 11.0, 4.0, 7.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013875961303710938, -0.0013415813446044922, -0.0012955665588378906, -0.001249551773071289, -0.0012035369873046875, -0.001157522201538086, -0.0011115074157714844, -0.0010654926300048828, -0.0010194778442382812, -0.0009734630584716797, -0.0009274482727050781, -0.0008814334869384766, -0.000835418701171875, -0.0007894039154052734, -0.0007433891296386719, -0.0006973743438720703, -0.0006513595581054688, -0.0006053447723388672, -0.0005593299865722656, -0.0005133152008056641, -0.0004673004150390625, -0.00042128562927246094, -0.0003752708435058594, -0.0003292560577392578, -0.00028324127197265625, -0.0002372264862060547, -0.00019121170043945312, -0.00014519691467285156, -9.918212890625e-05, -5.316734313964844e-05, -7.152557373046875e-06, 3.886222839355469e-05, 8.487701416015625e-05, 0.0001308917999267578, 0.00017690658569335938, 0.00022292137145996094, 0.0002689361572265625, 0.00031495094299316406, 0.0003609657287597656, 0.0004069805145263672, 0.00045299530029296875, 0.0004990100860595703, 0.0005450248718261719, 0.0005910396575927734, 0.000637054443359375, 0.0006830692291259766, 0.0007290840148925781, 0.0007750988006591797, 0.0008211135864257812, 0.0008671283721923828, 0.0009131431579589844, 0.0009591579437255859, 0.0010051727294921875, 0.001051187515258789, 0.0010972023010253906, 0.0011432170867919922, 0.0011892318725585938, 0.0012352466583251953, 0.0012812614440917969, 0.0013272762298583984, 0.001373291015625, 0.0014193058013916016, 0.0014653205871582031, 0.0015113353729248047, 0.0015573501586914062]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 6.0, 2.0, 9.0, 13.0, 16.0, 26.0, 37.0, 41.0, 56.0, 84.0, 144.0, 257.0, 423.0, 1611.0, 1042810.0, 1807.0, 488.0, 275.0, 119.0, 92.0, 53.0, 48.0, 30.0, 21.0, 18.0, 13.0, 12.0, 9.0, 9.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.038299560546875, -0.03718996047973633, -0.036080360412597656, -0.034970760345458984, -0.03386116027832031, -0.03275156021118164, -0.03164196014404297, -0.030532360076904297, -0.029422760009765625, -0.028313159942626953, -0.02720355987548828, -0.02609395980834961, -0.024984359741210938, -0.023874759674072266, -0.022765159606933594, -0.021655559539794922, -0.02054595947265625, -0.019436359405517578, -0.018326759338378906, -0.017217159271240234, -0.016107559204101562, -0.01499795913696289, -0.013888359069824219, -0.012778759002685547, -0.011669158935546875, -0.010559558868408203, -0.009449958801269531, -0.00834035873413086, -0.0072307586669921875, -0.006121158599853516, -0.005011558532714844, -0.003901958465576172, -0.0027923583984375, -0.0016827583312988281, -0.0005731582641601562, 0.0005364418029785156, 0.0016460418701171875, 0.0027556419372558594, 0.0038652420043945312, 0.004974842071533203, 0.006084442138671875, 0.007194042205810547, 0.008303642272949219, 0.00941324234008789, 0.010522842407226562, 0.011632442474365234, 0.012742042541503906, 0.013851642608642578, 0.01496124267578125, 0.016070842742919922, 0.017180442810058594, 0.018290042877197266, 0.019399642944335938, 0.02050924301147461, 0.02161884307861328, 0.022728443145751953, 0.023838043212890625, 0.024947643280029297, 0.02605724334716797, 0.02716684341430664, 0.028276443481445312, 0.029386043548583984, 0.030495643615722656, 0.03160524368286133, 0.03271484375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 7.0, 128.0, 553.0, 311.0, 17.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.005337605252861977, -0.005241822451353073, -0.005146039184182882, -0.005050256382673979, -0.004954473115503788, -0.0048586903139948845, -0.004762907512485981, -0.00466712424531579, -0.004571341443806887, -0.004475558642297983, -0.004379775375127792, -0.004283992573618889, -0.004188209306448698, -0.0040924265049397945, -0.003996643237769604, -0.0039008604362607002, -0.0038050771690905094, -0.0037092941347509623, -0.003613511100411415, -0.0035177282989025116, -0.0034219452645629644, -0.0033261622302234173, -0.00323037919588387, -0.003134596161544323, -0.0030388133600354195, -0.0029430303256958723, -0.002847247291356325, -0.0027514644898474216, -0.0026556814555078745, -0.0025598984211683273, -0.00246411538682878, -0.002368332352489233, -0.0022725495509803295, -0.0021767665166407824, -0.002080983482301235, -0.0019852006807923317, -0.0018894175300374627, -0.0017936346121132374, -0.0016978515777736902, -0.001602068543434143, -0.001506285509094596, -0.0014105024747550488, -0.0013147195568308234, -0.0012189365224912763, -0.001123153488151729, -0.0010273705702275038, -0.0009315875358879566, -0.0008358045015484095, -0.0007400214672088623, -0.0006442384910769761, -0.0005484554567374289, -0.00045267248060554266, -0.00035688947536982596, -0.00026110647013410926, -0.00016532349400222301, -6.954045966267586e-05, 2.6242516469210386e-05, 0.00012202551442896947, 0.00021780851238872856, 0.00031359150307253003, 0.00040937450830824673, 0.0005051575135439634, 0.0006009404896758497, 0.0006967235240153968, 0.0007925065001472831]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 10.0, 2.0, 7.0, 4.0, 12.0, 14.0, 14.0, 16.0, 20.0, 22.0, 29.0, 25.0, 40.0, 39.0, 30.0, 37.0, 25.0, 34.0, 32.0, 34.0, 42.0, 50.0, 40.0, 42.0, 48.0, 44.0, 43.0, 35.0, 25.0, 27.0, 35.0, 17.0, 20.0, 25.0, 16.0, 14.0, 3.0, 7.0, 9.0, 6.0, 3.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0006891489028930664, -0.0006665550172328949, -0.0006439611315727234, -0.0006213672459125519, -0.0005987733602523804, -0.0005761794745922089, -0.0005535855889320374, -0.0005309917032718658, -0.0005083978176116943, -0.00048580393195152283, -0.0004632100462913513, -0.0004406161606311798, -0.0004180222749710083, -0.0003954283893108368, -0.0003728345036506653, -0.0003502406179904938, -0.00032764673233032227, -0.00030505284667015076, -0.00028245896100997925, -0.00025986507534980774, -0.00023727118968963623, -0.00021467730402946472, -0.0001920834183692932, -0.0001694895327091217, -0.0001468956470489502, -0.0001243017613887787, -0.00010170787572860718, -7.911399006843567e-05, -5.652010440826416e-05, -3.392621874809265e-05, -1.1332333087921143e-05, 1.1261552572250366e-05, 3.3855438232421875e-05, 5.6449323892593384e-05, 7.904320955276489e-05, 0.0001016370952129364, 0.0001242309808731079, 0.00014682486653327942, 0.00016941875219345093, 0.00019201263785362244, 0.00021460652351379395, 0.00023720040917396545, 0.00025979429483413696, 0.00028238818049430847, 0.00030498206615448, 0.0003275759518146515, 0.000350169837474823, 0.0003727637231349945, 0.000395357608795166, 0.0004179514944553375, 0.00044054538011550903, 0.00046313926577568054, 0.00048573315143585205, 0.0005083270370960236, 0.0005309209227561951, 0.0005535148084163666, 0.0005761086940765381, 0.0005987025797367096, 0.0006212964653968811, 0.0006438903510570526, 0.0006664842367172241, 0.0006890781223773956, 0.0007116720080375671, 0.0007342658936977386, 0.0007568597793579102]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 7.0, 3.0, 9.0, 11.0, 8.0, 12.0, 16.0, 16.0, 24.0, 24.0, 26.0, 28.0, 25.0, 27.0, 38.0, 33.0, 42.0, 44.0, 40.0, 51.0, 53.0, 44.0, 38.0, 45.0, 33.0, 38.0, 38.0, 29.0, 24.0, 26.0, 24.0, 16.0, 21.0, 14.0, 16.0, 11.0, 8.0, 12.0, 8.0, 5.0, 3.0, 8.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.515625, -4.38385009765625, -4.2520751953125, -4.12030029296875, -3.988525390625, -3.85675048828125, -3.7249755859375, -3.59320068359375, -3.46142578125, -3.32965087890625, -3.1978759765625, -3.06610107421875, -2.934326171875, -2.80255126953125, -2.6707763671875, -2.53900146484375, -2.4072265625, -2.27545166015625, -2.1436767578125, -2.01190185546875, -1.880126953125, -1.74835205078125, -1.6165771484375, -1.48480224609375, -1.35302734375, -1.22125244140625, -1.0894775390625, -0.95770263671875, -0.825927734375, -0.69415283203125, -0.5623779296875, -0.43060302734375, -0.298828125, -0.16705322265625, -0.0352783203125, 0.09649658203125, 0.228271484375, 0.36004638671875, 0.4918212890625, 0.62359619140625, 0.75537109375, 0.88714599609375, 1.0189208984375, 1.15069580078125, 1.282470703125, 1.41424560546875, 1.5460205078125, 1.67779541015625, 1.8095703125, 1.94134521484375, 2.0731201171875, 2.20489501953125, 2.336669921875, 2.46844482421875, 2.6002197265625, 2.73199462890625, 2.86376953125, 2.99554443359375, 3.1273193359375, 3.25909423828125, 3.390869140625, 3.52264404296875, 3.6544189453125, 3.78619384765625, 3.91796875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 9.0, 8.0, 18.0, 20.0, 25.0, 32.0, 41.0, 81.0, 94.0, 131.0, 253.0, 366.0, 579.0, 887.0, 1451.0, 2504.0, 4499.0, 8220.0, 15789.0, 33796.0, 79771.0, 219307.0, 410146.0, 155601.0, 60120.0, 26091.0, 12702.0, 6803.0, 3595.0, 2043.0, 1308.0, 783.0, 470.0, 316.0, 219.0, 138.0, 112.0, 68.0, 47.0, 41.0, 24.0, 22.0, 14.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7890625, -2.7000732421875, -2.611083984375, -2.5220947265625, -2.43310546875, -2.3441162109375, -2.255126953125, -2.1661376953125, -2.0771484375, -1.9881591796875, -1.899169921875, -1.8101806640625, -1.72119140625, -1.6322021484375, -1.543212890625, -1.4542236328125, -1.365234375, -1.2762451171875, -1.187255859375, -1.0982666015625, -1.00927734375, -0.9202880859375, -0.831298828125, -0.7423095703125, -0.6533203125, -0.5643310546875, -0.475341796875, -0.3863525390625, -0.29736328125, -0.2083740234375, -0.119384765625, -0.0303955078125, 0.05859375, 0.1475830078125, 0.236572265625, 0.3255615234375, 0.41455078125, 0.5035400390625, 0.592529296875, 0.6815185546875, 0.7705078125, 0.8594970703125, 0.948486328125, 1.0374755859375, 1.12646484375, 1.2154541015625, 1.304443359375, 1.3934326171875, 1.482421875, 1.5714111328125, 1.660400390625, 1.7493896484375, 1.83837890625, 1.9273681640625, 2.016357421875, 2.1053466796875, 2.1943359375, 2.2833251953125, 2.372314453125, 2.4613037109375, 2.55029296875, 2.6392822265625, 2.728271484375, 2.8172607421875, 2.90625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 6.0, 11.0, 16.0, 20.0, 18.0, 14.0, 27.0, 30.0, 22.0, 31.0, 31.0, 31.0, 41.0, 38.0, 46.0, 69.0, 168.0, 1741.0, 188.0, 67.0, 42.0, 50.0, 37.0, 43.0, 40.0, 29.0, 36.0, 26.0, 13.0, 12.0, 25.0, 14.0, 11.0, 7.0, 10.0, 6.0, 3.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0], "bins": [-17.96875, -17.489990234375, -17.01123046875, -16.532470703125, -16.0537109375, -15.574951171875, -15.09619140625, -14.617431640625, -14.138671875, -13.659912109375, -13.18115234375, -12.702392578125, -12.2236328125, -11.744873046875, -11.26611328125, -10.787353515625, -10.30859375, -9.829833984375, -9.35107421875, -8.872314453125, -8.3935546875, -7.914794921875, -7.43603515625, -6.957275390625, -6.478515625, -5.999755859375, -5.52099609375, -5.042236328125, -4.5634765625, -4.084716796875, -3.60595703125, -3.127197265625, -2.6484375, -2.169677734375, -1.69091796875, -1.212158203125, -0.7333984375, -0.254638671875, 0.22412109375, 0.702880859375, 1.181640625, 1.660400390625, 2.13916015625, 2.617919921875, 3.0966796875, 3.575439453125, 4.05419921875, 4.532958984375, 5.01171875, 5.490478515625, 5.96923828125, 6.447998046875, 6.9267578125, 7.405517578125, 7.88427734375, 8.363037109375, 8.841796875, 9.320556640625, 9.79931640625, 10.278076171875, 10.7568359375, 11.235595703125, 11.71435546875, 12.193115234375, 12.671875]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 6.0, 6.0, 10.0, 12.0, 13.0, 11.0, 24.0, 14.0, 24.0, 25.0, 40.0, 42.0, 58.0, 98.0, 148.0, 247.0, 540.0, 1974.0, 40585.0, 3059443.0, 39095.0, 1913.0, 555.0, 240.0, 160.0, 89.0, 60.0, 48.0, 47.0, 28.0, 22.0, 23.0, 21.0, 18.0, 18.0, 13.0, 4.0, 6.0, 2.0, 7.0, 2.0, 4.0, 3.0, 0.0, 5.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.65625, -20.86865234375, -20.0810546875, -19.29345703125, -18.505859375, -17.71826171875, -16.9306640625, -16.14306640625, -15.35546875, -14.56787109375, -13.7802734375, -12.99267578125, -12.205078125, -11.41748046875, -10.6298828125, -9.84228515625, -9.0546875, -8.26708984375, -7.4794921875, -6.69189453125, -5.904296875, -5.11669921875, -4.3291015625, -3.54150390625, -2.75390625, -1.96630859375, -1.1787109375, -0.39111328125, 0.396484375, 1.18408203125, 1.9716796875, 2.75927734375, 3.546875, 4.33447265625, 5.1220703125, 5.90966796875, 6.697265625, 7.48486328125, 8.2724609375, 9.06005859375, 9.84765625, 10.63525390625, 11.4228515625, 12.21044921875, 12.998046875, 13.78564453125, 14.5732421875, 15.36083984375, 16.1484375, 16.93603515625, 17.7236328125, 18.51123046875, 19.298828125, 20.08642578125, 20.8740234375, 21.66162109375, 22.44921875, 23.23681640625, 24.0244140625, 24.81201171875, 25.599609375, 26.38720703125, 27.1748046875, 27.96240234375, 28.75]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 6.0, 54.0, 323.0, 481.0, 140.0, 15.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.1624526977539, -78.21477508544922, -76.26709747314453, -74.31941986083984, -72.37174224853516, -70.424072265625, -68.47639465332031, -66.52871704101562, -64.58103942871094, -62.63336181640625, -60.68568420410156, -58.738006591796875, -56.79033279418945, -54.842655181884766, -52.89497756958008, -50.94729995727539, -48.9996223449707, -47.051944732666016, -45.10426712036133, -43.156593322753906, -41.20891571044922, -39.26123809814453, -37.313560485839844, -35.365882873535156, -33.41820526123047, -31.47052764892578, -29.522851943969727, -27.57517433166504, -25.627498626708984, -23.679821014404297, -21.73214340209961, -19.784465789794922, -17.836795806884766, -15.889119148254395, -13.941442489624023, -11.993764877319336, -10.046088218688965, -8.098411560058594, -6.150733947753906, -4.203057289123535, -2.255380630493164, -0.30770373344421387, 1.6399731636047363, 3.5876502990722656, 5.535326957702637, 7.483003616333008, 9.430681228637695, 11.378357887268066, 13.326034545898438, 15.273711204528809, 17.22138786315918, 19.169065475463867, 21.116741180419922, 23.06441879272461, 25.012096405029297, 26.959774017333984, 28.90744972229004, 30.855127334594727, 32.80280303955078, 34.75048065185547, 36.698158264160156, 38.645835876464844, 40.59351348876953, 42.54118728637695, 44.48886489868164]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 1.0, 8.0, 9.0, 10.0, 9.0, 20.0, 17.0, 9.0, 21.0, 29.0, 18.0, 27.0, 28.0, 25.0, 38.0, 30.0, 30.0, 30.0, 42.0, 38.0, 43.0, 38.0, 36.0, 43.0, 38.0, 34.0, 39.0, 24.0, 33.0, 22.0, 32.0, 25.0, 13.0, 22.0, 18.0, 11.0, 17.0, 17.0, 10.0, 7.0, 7.0, 6.0, 8.0, 4.0, 5.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-41.67333221435547, -40.28388214111328, -38.89442825317383, -37.50497817993164, -36.11552429199219, -34.72607421875, -33.33662033081055, -31.94717025756836, -30.557716369628906, -29.168264389038086, -27.778812408447266, -26.389360427856445, -24.999908447265625, -23.610456466674805, -22.221004486083984, -20.831554412841797, -19.442102432250977, -18.052650451660156, -16.663198471069336, -15.273746490478516, -13.884294509887695, -12.494842529296875, -11.105391502380371, -9.71593952178955, -8.32648754119873, -6.93703556060791, -5.54758358001709, -4.158132076263428, -2.7686800956726074, -1.379228115081787, 0.010223388671875, 1.3996753692626953, 2.7891273498535156, 4.178579330444336, 5.568031311035156, 6.957482814788818, 8.346935272216797, 9.736387252807617, 11.125838279724121, 12.515290260314941, 13.904742240905762, 15.294194221496582, 16.683645248413086, 18.073097229003906, 19.462549209594727, 20.852001190185547, 22.241453170776367, 23.630905151367188, 25.020357131958008, 26.409809112548828, 27.79926109313965, 29.18871307373047, 30.57816505432129, 31.96761703491211, 33.3570671081543, 34.74652099609375, 36.13597106933594, 37.525421142578125, 38.91487503051758, 40.304325103759766, 41.69377899169922, 43.083229064941406, 44.47268295288086, 45.86213302612305, 47.2515869140625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 4.0, 9.0, 8.0, 5.0, 9.0, 15.0, 11.0, 16.0, 27.0, 22.0, 29.0, 22.0, 38.0, 26.0, 19.0, 51.0, 37.0, 44.0, 47.0, 57.0, 44.0, 46.0, 43.0, 40.0, 37.0, 35.0, 33.0, 27.0, 32.0, 21.0, 27.0, 15.0, 20.0, 20.0, 9.0, 9.0, 9.0, 9.0, 11.0, 5.0, 4.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.85546875, -4.7171630859375, -4.578857421875, -4.4405517578125, -4.30224609375, -4.1639404296875, -4.025634765625, -3.8873291015625, -3.7490234375, -3.6107177734375, -3.472412109375, -3.3341064453125, -3.19580078125, -3.0574951171875, -2.919189453125, -2.7808837890625, -2.642578125, -2.5042724609375, -2.365966796875, -2.2276611328125, -2.08935546875, -1.9510498046875, -1.812744140625, -1.6744384765625, -1.5361328125, -1.3978271484375, -1.259521484375, -1.1212158203125, -0.98291015625, -0.8446044921875, -0.706298828125, -0.5679931640625, -0.4296875, -0.2913818359375, -0.153076171875, -0.0147705078125, 0.12353515625, 0.2618408203125, 0.400146484375, 0.5384521484375, 0.6767578125, 0.8150634765625, 0.953369140625, 1.0916748046875, 1.22998046875, 1.3682861328125, 1.506591796875, 1.6448974609375, 1.783203125, 1.9215087890625, 2.059814453125, 2.1981201171875, 2.33642578125, 2.4747314453125, 2.613037109375, 2.7513427734375, 2.8896484375, 3.0279541015625, 3.166259765625, 3.3045654296875, 3.44287109375, 3.5811767578125, 3.719482421875, 3.8577880859375, 3.99609375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 2.0, 6.0, 5.0, 4.0, 11.0, 8.0, 9.0, 12.0, 16.0, 21.0, 14.0, 25.0, 20.0, 30.0, 29.0, 32.0, 36.0, 59.0, 117.0, 290.0, 1688.0, 46687.0, 3346457.0, 788261.0, 9141.0, 719.0, 170.0, 106.0, 57.0, 29.0, 22.0, 27.0, 19.0, 21.0, 28.0, 21.0, 15.0, 19.0, 7.0, 9.0, 4.0, 5.0, 5.0, 5.0, 7.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-25.34375, -24.593505859375, -23.84326171875, -23.093017578125, -22.3427734375, -21.592529296875, -20.84228515625, -20.092041015625, -19.341796875, -18.591552734375, -17.84130859375, -17.091064453125, -16.3408203125, -15.590576171875, -14.84033203125, -14.090087890625, -13.33984375, -12.589599609375, -11.83935546875, -11.089111328125, -10.3388671875, -9.588623046875, -8.83837890625, -8.088134765625, -7.337890625, -6.587646484375, -5.83740234375, -5.087158203125, -4.3369140625, -3.586669921875, -2.83642578125, -2.086181640625, -1.3359375, -0.585693359375, 0.16455078125, 0.914794921875, 1.6650390625, 2.415283203125, 3.16552734375, 3.915771484375, 4.666015625, 5.416259765625, 6.16650390625, 6.916748046875, 7.6669921875, 8.417236328125, 9.16748046875, 9.917724609375, 10.66796875, 11.418212890625, 12.16845703125, 12.918701171875, 13.6689453125, 14.419189453125, 15.16943359375, 15.919677734375, 16.669921875, 17.420166015625, 18.17041015625, 18.920654296875, 19.6708984375, 20.421142578125, 21.17138671875, 21.921630859375, 22.671875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 8.0, 13.0, 25.0, 33.0, 44.0, 66.0, 106.0, 171.0, 271.0, 427.0, 616.0, 688.0, 556.0, 374.0, 260.0, 149.0, 97.0, 61.0, 36.0, 32.0, 16.0, 15.0, 4.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-23.5625, -23.00634765625, -22.4501953125, -21.89404296875, -21.337890625, -20.78173828125, -20.2255859375, -19.66943359375, -19.11328125, -18.55712890625, -18.0009765625, -17.44482421875, -16.888671875, -16.33251953125, -15.7763671875, -15.22021484375, -14.6640625, -14.10791015625, -13.5517578125, -12.99560546875, -12.439453125, -11.88330078125, -11.3271484375, -10.77099609375, -10.21484375, -9.65869140625, -9.1025390625, -8.54638671875, -7.990234375, -7.43408203125, -6.8779296875, -6.32177734375, -5.765625, -5.20947265625, -4.6533203125, -4.09716796875, -3.541015625, -2.98486328125, -2.4287109375, -1.87255859375, -1.31640625, -0.76025390625, -0.2041015625, 0.35205078125, 0.908203125, 1.46435546875, 2.0205078125, 2.57666015625, 3.1328125, 3.68896484375, 4.2451171875, 4.80126953125, 5.357421875, 5.91357421875, 6.4697265625, 7.02587890625, 7.58203125, 8.13818359375, 8.6943359375, 9.25048828125, 9.806640625, 10.36279296875, 10.9189453125, 11.47509765625, 12.03125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 14.0, 15.0, 22.0, 25.0, 49.0, 57.0, 102.0, 141.0, 310.0, 606.0, 1993.0, 84018.0, 4045372.0, 58444.0, 1846.0, 577.0, 279.0, 139.0, 105.0, 67.0, 36.0, 12.0, 19.0, 17.0, 8.0, 4.0, 1.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.75, -48.00244140625, -46.2548828125, -44.50732421875, -42.759765625, -41.01220703125, -39.2646484375, -37.51708984375, -35.76953125, -34.02197265625, -32.2744140625, -30.52685546875, -28.779296875, -27.03173828125, -25.2841796875, -23.53662109375, -21.7890625, -20.04150390625, -18.2939453125, -16.54638671875, -14.798828125, -13.05126953125, -11.3037109375, -9.55615234375, -7.80859375, -6.06103515625, -4.3134765625, -2.56591796875, -0.818359375, 0.92919921875, 2.6767578125, 4.42431640625, 6.171875, 7.91943359375, 9.6669921875, 11.41455078125, 13.162109375, 14.90966796875, 16.6572265625, 18.40478515625, 20.15234375, 21.89990234375, 23.6474609375, 25.39501953125, 27.142578125, 28.89013671875, 30.6376953125, 32.38525390625, 34.1328125, 35.88037109375, 37.6279296875, 39.37548828125, 41.123046875, 42.87060546875, 44.6181640625, 46.36572265625, 48.11328125, 49.86083984375, 51.6083984375, 53.35595703125, 55.103515625, 56.85107421875, 58.5986328125, 60.34619140625, 62.09375]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 14.0, 17.0, 28.0, 65.0, 87.0, 128.0, 119.0, 148.0, 132.0, 112.0, 62.0, 35.0, 26.0, 16.0, 6.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-93.03020477294922, -91.1414794921875, -89.25274658203125, -87.36402130126953, -85.47528839111328, -83.58656311035156, -81.69783020019531, -79.8091049194336, -77.92037963867188, -76.03165435791016, -74.1429214477539, -72.25419616699219, -70.36546325683594, -68.47673797607422, -66.58800506591797, -64.69927978515625, -62.810546875, -60.921817779541016, -59.03308868408203, -57.14435958862305, -55.25563049316406, -53.366905212402344, -51.47817611694336, -49.589447021484375, -47.70071792602539, -45.811988830566406, -43.92325973510742, -42.03453063964844, -40.14580535888672, -38.25707244873047, -36.36834716796875, -34.479618072509766, -32.59088897705078, -30.702159881591797, -28.813430786132812, -26.92470359802246, -25.035974502563477, -23.147245407104492, -21.25851821899414, -19.369789123535156, -17.481061935424805, -15.59233283996582, -13.703604698181152, -11.814876556396484, -9.9261474609375, -8.037418365478516, -6.148690223693848, -4.25996208190918, -2.3712329864501953, -0.48250436782836914, 1.406224250793457, 3.294952869415283, 5.183681488037109, 7.072410583496094, 8.961138725280762, 10.84986686706543, 12.738595962524414, 14.627325057983398, 16.51605224609375, 18.404781341552734, 20.29351043701172, 22.182239532470703, 24.070968627929688, 25.95969581604004, 27.848424911499023]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 8.0, 7.0, 6.0, 13.0, 17.0, 20.0, 18.0, 18.0, 31.0, 34.0, 24.0, 28.0, 45.0, 35.0, 36.0, 39.0, 55.0, 49.0, 51.0, 45.0, 51.0, 35.0, 44.0, 41.0, 40.0, 32.0, 38.0, 24.0, 21.0, 19.0, 10.0, 12.0, 13.0, 11.0, 11.0, 7.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.356170654296875, -45.92485809326172, -44.49354553222656, -43.062232971191406, -41.630916595458984, -40.19960403442383, -38.76829147338867, -37.336978912353516, -35.905662536621094, -34.47434997558594, -33.04303741455078, -31.611722946166992, -30.180408477783203, -28.749095916748047, -27.31778335571289, -25.886470794677734, -24.455158233642578, -23.023845672607422, -21.592531204223633, -20.161218643188477, -18.729904174804688, -17.29859161376953, -15.867279052734375, -14.435965538024902, -13.00465202331543, -11.573338508605957, -10.142024993896484, -8.710712432861328, -7.2793989181518555, -5.848085403442383, -4.416772842407227, -2.985459327697754, -1.5541458129882812, -0.1228325366973877, 1.3084807395935059, 2.7397937774658203, 4.171107292175293, 5.602420806884766, 7.033733367919922, 8.465046882629395, 9.896360397338867, 11.32767391204834, 12.758987426757812, 14.190299987792969, 15.621613502502441, 17.052927017211914, 18.48423957824707, 19.91555404663086, 21.346866607666016, 22.778179168701172, 24.20949363708496, 25.640806198120117, 27.072120666503906, 28.503433227539062, 29.93474578857422, 31.366058349609375, 32.79737091064453, 34.22868347167969, 35.659996032714844, 37.09130859375, 38.52262496948242, 39.95393753051758, 41.385250091552734, 42.81656265258789, 44.24787902832031]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 2.0, 8.0, 4.0, 5.0, 8.0, 9.0, 9.0, 14.0, 14.0, 17.0, 18.0, 27.0, 24.0, 26.0, 28.0, 30.0, 29.0, 41.0, 26.0, 35.0, 44.0, 36.0, 47.0, 45.0, 38.0, 37.0, 41.0, 36.0, 25.0, 40.0, 24.0, 26.0, 25.0, 20.0, 29.0, 16.0, 20.0, 15.0, 13.0, 13.0, 11.0, 2.0, 5.0, 10.0, 5.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.3359375, -4.2042236328125, -4.072509765625, -3.9407958984375, -3.80908203125, -3.6773681640625, -3.545654296875, -3.4139404296875, -3.2822265625, -3.1505126953125, -3.018798828125, -2.8870849609375, -2.75537109375, -2.6236572265625, -2.491943359375, -2.3602294921875, -2.228515625, -2.0968017578125, -1.965087890625, -1.8333740234375, -1.70166015625, -1.5699462890625, -1.438232421875, -1.3065185546875, -1.1748046875, -1.0430908203125, -0.911376953125, -0.7796630859375, -0.64794921875, -0.5162353515625, -0.384521484375, -0.2528076171875, -0.12109375, 0.0106201171875, 0.142333984375, 0.2740478515625, 0.40576171875, 0.5374755859375, 0.669189453125, 0.8009033203125, 0.9326171875, 1.0643310546875, 1.196044921875, 1.3277587890625, 1.45947265625, 1.5911865234375, 1.722900390625, 1.8546142578125, 1.986328125, 2.1180419921875, 2.249755859375, 2.3814697265625, 2.51318359375, 2.6448974609375, 2.776611328125, 2.9083251953125, 3.0400390625, 3.1717529296875, 3.303466796875, 3.4351806640625, 3.56689453125, 3.6986083984375, 3.830322265625, 3.9620361328125, 4.09375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 22.0, 25.0, 35.0, 52.0, 69.0, 119.0, 168.0, 257.0, 340.0, 477.0, 726.0, 1075.0, 1625.0, 2347.0, 3306.0, 4829.0, 7150.0, 10695.0, 15801.0, 23919.0, 36792.0, 58911.0, 96417.0, 153541.0, 199542.0, 157717.0, 99149.0, 60425.0, 37847.0, 24544.0, 16457.0, 11060.0, 7429.0, 5035.0, 3395.0, 2223.0, 1618.0, 1062.0, 761.0, 518.0, 313.0, 246.0, 156.0, 104.0, 89.0, 49.0, 36.0, 23.0, 19.0, 11.0, 8.0, 7.0, 3.0, 4.0, 0.0, 0.0, 4.0], "bins": [-0.4912109375, -0.4756317138671875, -0.460052490234375, -0.4444732666015625, -0.42889404296875, -0.4133148193359375, -0.397735595703125, -0.3821563720703125, -0.3665771484375, -0.3509979248046875, -0.335418701171875, -0.3198394775390625, -0.30426025390625, -0.2886810302734375, -0.273101806640625, -0.2575225830078125, -0.241943359375, -0.2263641357421875, -0.210784912109375, -0.1952056884765625, -0.17962646484375, -0.1640472412109375, -0.148468017578125, -0.1328887939453125, -0.1173095703125, -0.1017303466796875, -0.086151123046875, -0.0705718994140625, -0.05499267578125, -0.0394134521484375, -0.023834228515625, -0.0082550048828125, 0.00732421875, 0.0229034423828125, 0.038482666015625, 0.0540618896484375, 0.06964111328125, 0.0852203369140625, 0.100799560546875, 0.1163787841796875, 0.1319580078125, 0.1475372314453125, 0.163116455078125, 0.1786956787109375, 0.19427490234375, 0.2098541259765625, 0.225433349609375, 0.2410125732421875, 0.256591796875, 0.2721710205078125, 0.287750244140625, 0.3033294677734375, 0.31890869140625, 0.3344879150390625, 0.350067138671875, 0.3656463623046875, 0.3812255859375, 0.3968048095703125, 0.412384033203125, 0.4279632568359375, 0.44354248046875, 0.4591217041015625, 0.474700927734375, 0.4902801513671875, 0.505859375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 1.0, 2.0, 3.0, 3.0, 10.0, 10.0, 11.0, 10.0, 15.0, 18.0, 13.0, 28.0, 23.0, 35.0, 28.0, 35.0, 32.0, 33.0, 35.0, 41.0, 41.0, 53.0, 1058.0, 35.0, 40.0, 43.0, 44.0, 40.0, 26.0, 34.0, 30.0, 26.0, 27.0, 23.0, 22.0, 17.0, 17.0, 13.0, 12.0, 5.0, 8.0, 6.0, 5.0, 6.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8984375, -2.80938720703125, -2.7203369140625, -2.63128662109375, -2.542236328125, -2.45318603515625, -2.3641357421875, -2.27508544921875, -2.18603515625, -2.09698486328125, -2.0079345703125, -1.91888427734375, -1.829833984375, -1.74078369140625, -1.6517333984375, -1.56268310546875, -1.4736328125, -1.38458251953125, -1.2955322265625, -1.20648193359375, -1.117431640625, -1.02838134765625, -0.9393310546875, -0.85028076171875, -0.76123046875, -0.67218017578125, -0.5831298828125, -0.49407958984375, -0.405029296875, -0.31597900390625, -0.2269287109375, -0.13787841796875, -0.048828125, 0.04022216796875, 0.1292724609375, 0.21832275390625, 0.307373046875, 0.39642333984375, 0.4854736328125, 0.57452392578125, 0.66357421875, 0.75262451171875, 0.8416748046875, 0.93072509765625, 1.019775390625, 1.10882568359375, 1.1978759765625, 1.28692626953125, 1.3759765625, 1.46502685546875, 1.5540771484375, 1.64312744140625, 1.732177734375, 1.82122802734375, 1.9102783203125, 1.99932861328125, 2.08837890625, 2.17742919921875, 2.2664794921875, 2.35552978515625, 2.444580078125, 2.53363037109375, 2.6226806640625, 2.71173095703125, 2.80078125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 8.0, 12.0, 19.0, 20.0, 36.0, 50.0, 70.0, 94.0, 163.0, 289.0, 445.0, 623.0, 1064.0, 1692.0, 2716.0, 4372.0, 7235.0, 11820.0, 20000.0, 34872.0, 61138.0, 110762.0, 193896.0, 1282796.0, 158338.0, 87208.0, 48318.0, 27648.0, 16314.0, 9504.0, 5821.0, 3620.0, 2252.0, 1384.0, 950.0, 561.0, 368.0, 224.0, 142.0, 107.0, 68.0, 44.0, 19.0, 17.0, 14.0, 7.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.552734375, -0.5356216430664062, -0.5185089111328125, -0.5013961791992188, -0.484283447265625, -0.46717071533203125, -0.4500579833984375, -0.43294525146484375, -0.41583251953125, -0.39871978759765625, -0.3816070556640625, -0.36449432373046875, -0.347381591796875, -0.33026885986328125, -0.3131561279296875, -0.29604339599609375, -0.2789306640625, -0.26181793212890625, -0.2447052001953125, -0.22759246826171875, -0.210479736328125, -0.19336700439453125, -0.1762542724609375, -0.15914154052734375, -0.14202880859375, -0.12491607666015625, -0.1078033447265625, -0.09069061279296875, -0.073577880859375, -0.05646514892578125, -0.0393524169921875, -0.02223968505859375, -0.005126953125, 0.01198577880859375, 0.0290985107421875, 0.04621124267578125, 0.063323974609375, 0.08043670654296875, 0.0975494384765625, 0.11466217041015625, 0.13177490234375, 0.14888763427734375, 0.1660003662109375, 0.18311309814453125, 0.200225830078125, 0.21733856201171875, 0.2344512939453125, 0.25156402587890625, 0.2686767578125, 0.28578948974609375, 0.3029022216796875, 0.32001495361328125, 0.337127685546875, 0.35424041748046875, 0.3713531494140625, 0.38846588134765625, 0.40557861328125, 0.42269134521484375, 0.4398040771484375, 0.45691680908203125, 0.474029541015625, 0.49114227294921875, 0.5082550048828125, 0.5253677368164062, 0.54248046875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 6.0, 5.0, 3.0, 4.0, 9.0, 7.0, 11.0, 11.0, 12.0, 17.0, 23.0, 22.0, 23.0, 25.0, 39.0, 51.0, 45.0, 71.0, 42.0, 62.0, 46.0, 49.0, 56.0, 36.0, 49.0, 36.0, 43.0, 27.0, 28.0, 31.0, 21.0, 25.0, 11.0, 6.0, 11.0, 11.0, 6.0, 5.0, 4.0, 3.0, 5.0, 3.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0012369155883789062, -0.0012003332376480103, -0.0011637508869171143, -0.0011271685361862183, -0.0010905861854553223, -0.0010540038347244263, -0.0010174214839935303, -0.0009808391332626343, -0.0009442567825317383, -0.0009076744318008423, -0.0008710920810699463, -0.0008345097303390503, -0.0007979273796081543, -0.0007613450288772583, -0.0007247626781463623, -0.0006881803274154663, -0.0006515979766845703, -0.0006150156259536743, -0.0005784332752227783, -0.0005418509244918823, -0.0005052685737609863, -0.00046868622303009033, -0.00043210387229919434, -0.00039552152156829834, -0.00035893917083740234, -0.00032235682010650635, -0.00028577446937561035, -0.00024919211864471436, -0.00021260976791381836, -0.00017602741718292236, -0.00013944506645202637, -0.00010286271572113037, -6.628036499023438e-05, -2.969801425933838e-05, 6.884336471557617e-06, 4.346668720245361e-05, 8.004903793334961e-05, 0.0001166313886642456, 0.0001532137393951416, 0.0001897960901260376, 0.0002263784408569336, 0.0002629607915878296, 0.0002995431423187256, 0.0003361254930496216, 0.0003727078437805176, 0.0004092901945114136, 0.00044587254524230957, 0.00048245489597320557, 0.0005190372467041016, 0.0005556195974349976, 0.0005922019481658936, 0.0006287842988967896, 0.0006653666496276855, 0.0007019490003585815, 0.0007385313510894775, 0.0007751137018203735, 0.0008116960525512695, 0.0008482784032821655, 0.0008848607540130615, 0.0009214431047439575, 0.0009580254554748535, 0.0009946078062057495, 0.0010311901569366455, 0.0010677725076675415, 0.0011043548583984375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 0.0, 3.0, 6.0, 6.0, 5.0, 5.0, 9.0, 6.0, 9.0, 20.0, 18.0, 29.0, 35.0, 47.0, 48.0, 75.0, 111.0, 138.0, 203.0, 269.0, 528.0, 1283.0, 614475.0, 428530.0, 1165.0, 480.0, 297.0, 168.0, 139.0, 88.0, 70.0, 58.0, 44.0, 36.0, 31.0, 23.0, 19.0, 10.0, 12.0, 12.0, 8.0, 7.0, 10.0, 3.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0217437744140625, -0.0210416316986084, -0.020339488983154297, -0.019637346267700195, -0.018935203552246094, -0.018233060836791992, -0.01753091812133789, -0.01682877540588379, -0.016126632690429688, -0.015424489974975586, -0.014722347259521484, -0.014020204544067383, -0.013318061828613281, -0.01261591911315918, -0.011913776397705078, -0.011211633682250977, -0.010509490966796875, -0.009807348251342773, -0.009105205535888672, -0.00840306282043457, -0.007700920104980469, -0.006998777389526367, -0.006296634674072266, -0.005594491958618164, -0.0048923492431640625, -0.004190206527709961, -0.0034880638122558594, -0.002785921096801758, -0.0020837783813476562, -0.0013816356658935547, -0.0006794929504394531, 2.2649765014648438e-05, 0.00072479248046875, 0.0014269351959228516, 0.002129077911376953, 0.0028312206268310547, 0.0035333633422851562, 0.004235506057739258, 0.004937648773193359, 0.005639791488647461, 0.0063419342041015625, 0.007044076919555664, 0.007746219635009766, 0.008448362350463867, 0.009150505065917969, 0.00985264778137207, 0.010554790496826172, 0.011256933212280273, 0.011959075927734375, 0.012661218643188477, 0.013363361358642578, 0.01406550407409668, 0.014767646789550781, 0.015469789505004883, 0.016171932220458984, 0.016874074935913086, 0.017576217651367188, 0.01827836036682129, 0.01898050308227539, 0.019682645797729492, 0.020384788513183594, 0.021086931228637695, 0.021789073944091797, 0.0224912166595459, 0.023193359375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 14.0, 93.0, 372.0, 412.0, 114.0, 10.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030934158712625504, -0.0030024698935449123, -0.0029115239158272743, -0.0028205779381096363, -0.0027296319603919983, -0.0026386857498437166, -0.0025477397721260786, -0.0024567937944084406, -0.0023658478166908026, -0.0022749018389731646, -0.0021839558612555265, -0.0020930098835378885, -0.002002063672989607, -0.0019111178116872907, -0.0018201717175543308, -0.0017292257398366928, -0.0016382797621190548, -0.0015473337844014168, -0.0014563878066837788, -0.001365441712550819, -0.001274495734833181, -0.0011835497571155429, -0.001092603662982583, -0.001001657685264945, -0.000910711707547307, -0.000819765729829669, -0.0007288196939043701, -0.0006378736579790711, -0.0005469276802614331, -0.00045598167343996465, -0.0003650356666184962, -0.00027408963069319725, -0.00018314365297555923, -9.219764615409076e-05, -1.2516393326222897e-06, 8.969436748884618e-05, 0.00018064037431031466, 0.00027158638113178313, 0.0003625323879532516, 0.00045347842387855053, 0.0005444244015961885, 0.0006353703793138266, 0.0007263164152391255, 0.0008172624511644244, 0.0009082084288820624, 0.0009991544065997005, 0.0010901005007326603, 0.0011810464784502983, 0.0012719924561679363, 0.0013629384338855743, 0.0014538844116032124, 0.0015448305057361722, 0.0016357764834538102, 0.0017267224611714482, 0.001817668555304408, 0.001908614533022046, 0.001999560510739684, 0.002090506488457322, 0.00218145246617496, 0.002272398443892598, 0.00236334465444088, 0.002454290632158518, 0.002545236609876156, 0.002636182587593794, 0.002727128565311432]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 7.0, 5.0, 13.0, 11.0, 14.0, 15.0, 14.0, 19.0, 20.0, 27.0, 33.0, 32.0, 24.0, 44.0, 34.0, 37.0, 52.0, 49.0, 45.0, 34.0, 31.0, 42.0, 40.0, 44.0, 27.0, 32.0, 28.0, 34.0, 24.0, 17.0, 29.0, 23.0, 12.0, 18.0, 13.0, 14.0, 9.0, 6.0, 3.0, 3.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.000668644905090332, -0.0006485879421234131, -0.0006285309791564941, -0.0006084740161895752, -0.0005884170532226562, -0.0005683600902557373, -0.0005483031272888184, -0.0005282461643218994, -0.0005081892013549805, -0.0004881322383880615, -0.0004680752754211426, -0.00044801831245422363, -0.0004279613494873047, -0.00040790438652038574, -0.0003878474235534668, -0.00036779046058654785, -0.0003477334976196289, -0.00032767653465270996, -0.000307619571685791, -0.00028756260871887207, -0.0002675056457519531, -0.0002474486827850342, -0.00022739171981811523, -0.0002073347568511963, -0.00018727779388427734, -0.0001672208309173584, -0.00014716386795043945, -0.0001271069049835205, -0.00010704994201660156, -8.699297904968262e-05, -6.693601608276367e-05, -4.6879053115844727e-05, -2.682209014892578e-05, -6.765127182006836e-06, 1.329183578491211e-05, 3.3348798751831055e-05, 5.340576171875e-05, 7.346272468566895e-05, 9.351968765258789e-05, 0.00011357665061950684, 0.00013363361358642578, 0.00015369057655334473, 0.00017374753952026367, 0.00019380450248718262, 0.00021386146545410156, 0.0002339184284210205, 0.00025397539138793945, 0.0002740323543548584, 0.00029408931732177734, 0.0003141462802886963, 0.00033420324325561523, 0.0003542602062225342, 0.0003743171691894531, 0.00039437413215637207, 0.000414431095123291, 0.00043448805809020996, 0.0004545450210571289, 0.00047460198402404785, 0.0004946589469909668, 0.0005147159099578857, 0.0005347728729248047, 0.0005548298358917236, 0.0005748867988586426, 0.0005949437618255615, 0.0006150007247924805]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 2.0, 8.0, 4.0, 5.0, 8.0, 9.0, 9.0, 14.0, 14.0, 17.0, 18.0, 27.0, 24.0, 26.0, 28.0, 30.0, 29.0, 41.0, 26.0, 35.0, 44.0, 36.0, 47.0, 45.0, 38.0, 37.0, 41.0, 36.0, 25.0, 40.0, 24.0, 26.0, 25.0, 20.0, 29.0, 16.0, 20.0, 15.0, 13.0, 13.0, 11.0, 2.0, 5.0, 10.0, 5.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.3359375, -4.2042236328125, -4.072509765625, -3.9407958984375, -3.80908203125, -3.6773681640625, -3.545654296875, -3.4139404296875, -3.2822265625, -3.1505126953125, -3.018798828125, -2.8870849609375, -2.75537109375, -2.6236572265625, -2.491943359375, -2.3602294921875, -2.228515625, -2.0968017578125, -1.965087890625, -1.8333740234375, -1.70166015625, -1.5699462890625, -1.438232421875, -1.3065185546875, -1.1748046875, -1.0430908203125, -0.911376953125, -0.7796630859375, -0.64794921875, -0.5162353515625, -0.384521484375, -0.2528076171875, -0.12109375, 0.0106201171875, 0.142333984375, 0.2740478515625, 0.40576171875, 0.5374755859375, 0.669189453125, 0.8009033203125, 0.9326171875, 1.0643310546875, 1.196044921875, 1.3277587890625, 1.45947265625, 1.5911865234375, 1.722900390625, 1.8546142578125, 1.986328125, 2.1180419921875, 2.249755859375, 2.3814697265625, 2.51318359375, 2.6448974609375, 2.776611328125, 2.9083251953125, 3.0400390625, 3.1717529296875, 3.303466796875, 3.4351806640625, 3.56689453125, 3.6986083984375, 3.830322265625, 3.9620361328125, 4.09375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 5.0, 1.0, 1.0, 3.0, 6.0, 7.0, 12.0, 14.0, 21.0, 23.0, 49.0, 55.0, 58.0, 114.0, 162.0, 226.0, 325.0, 465.0, 728.0, 1177.0, 2024.0, 3732.0, 7389.0, 16949.0, 48366.0, 176529.0, 490244.0, 207806.0, 55261.0, 19057.0, 7825.0, 3950.0, 2208.0, 1261.0, 837.0, 529.0, 374.0, 213.0, 180.0, 126.0, 70.0, 51.0, 38.0, 25.0, 30.0, 12.0, 7.0, 7.0, 4.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1875, -3.08319091796875, -2.9788818359375, -2.87457275390625, -2.770263671875, -2.66595458984375, -2.5616455078125, -2.45733642578125, -2.35302734375, -2.24871826171875, -2.1444091796875, -2.04010009765625, -1.935791015625, -1.83148193359375, -1.7271728515625, -1.62286376953125, -1.5185546875, -1.41424560546875, -1.3099365234375, -1.20562744140625, -1.101318359375, -0.99700927734375, -0.8927001953125, -0.78839111328125, -0.68408203125, -0.57977294921875, -0.4754638671875, -0.37115478515625, -0.266845703125, -0.16253662109375, -0.0582275390625, 0.04608154296875, 0.150390625, 0.25469970703125, 0.3590087890625, 0.46331787109375, 0.567626953125, 0.67193603515625, 0.7762451171875, 0.88055419921875, 0.98486328125, 1.08917236328125, 1.1934814453125, 1.29779052734375, 1.402099609375, 1.50640869140625, 1.6107177734375, 1.71502685546875, 1.8193359375, 1.92364501953125, 2.0279541015625, 2.13226318359375, 2.236572265625, 2.34088134765625, 2.4451904296875, 2.54949951171875, 2.65380859375, 2.75811767578125, 2.8624267578125, 2.96673583984375, 3.071044921875, 3.17535400390625, 3.2796630859375, 3.38397216796875, 3.48828125]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 1.0, 4.0, 7.0, 5.0, 8.0, 17.0, 8.0, 11.0, 14.0, 23.0, 23.0, 24.0, 25.0, 34.0, 33.0, 38.0, 48.0, 41.0, 52.0, 65.0, 1783.0, 298.0, 70.0, 39.0, 50.0, 43.0, 38.0, 44.0, 39.0, 40.0, 19.0, 18.0, 18.0, 14.0, 19.0, 11.0, 9.0, 7.0, 6.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.953125, -17.421875, -16.890625, -16.359375, -15.828125, -15.296875, -14.765625, -14.234375, -13.703125, -13.171875, -12.640625, -12.109375, -11.578125, -11.046875, -10.515625, -9.984375, -9.453125, -8.921875, -8.390625, -7.859375, -7.328125, -6.796875, -6.265625, -5.734375, -5.203125, -4.671875, -4.140625, -3.609375, -3.078125, -2.546875, -2.015625, -1.484375, -0.953125, -0.421875, 0.109375, 0.640625, 1.171875, 1.703125, 2.234375, 2.765625, 3.296875, 3.828125, 4.359375, 4.890625, 5.421875, 5.953125, 6.484375, 7.015625, 7.546875, 8.078125, 8.609375, 9.140625, 9.671875, 10.203125, 10.734375, 11.265625, 11.796875, 12.328125, 12.859375, 13.390625, 13.921875, 14.453125, 14.984375, 15.515625, 16.046875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 6.0, 8.0, 6.0, 15.0, 17.0, 17.0, 20.0, 21.0, 27.0, 38.0, 52.0, 65.0, 88.0, 151.0, 261.0, 527.0, 2311.0, 164811.0, 2970321.0, 5297.0, 733.0, 329.0, 161.0, 118.0, 63.0, 47.0, 35.0, 32.0, 20.0, 27.0, 16.0, 12.0, 12.0, 14.0, 6.0, 6.0, 9.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.109375, -25.243896484375, -24.37841796875, -23.512939453125, -22.6474609375, -21.781982421875, -20.91650390625, -20.051025390625, -19.185546875, -18.320068359375, -17.45458984375, -16.589111328125, -15.7236328125, -14.858154296875, -13.99267578125, -13.127197265625, -12.26171875, -11.396240234375, -10.53076171875, -9.665283203125, -8.7998046875, -7.934326171875, -7.06884765625, -6.203369140625, -5.337890625, -4.472412109375, -3.60693359375, -2.741455078125, -1.8759765625, -1.010498046875, -0.14501953125, 0.720458984375, 1.5859375, 2.451416015625, 3.31689453125, 4.182373046875, 5.0478515625, 5.913330078125, 6.77880859375, 7.644287109375, 8.509765625, 9.375244140625, 10.24072265625, 11.106201171875, 11.9716796875, 12.837158203125, 13.70263671875, 14.568115234375, 15.43359375, 16.299072265625, 17.16455078125, 18.030029296875, 18.8955078125, 19.760986328125, 20.62646484375, 21.491943359375, 22.357421875, 23.222900390625, 24.08837890625, 24.953857421875, 25.8193359375, 26.684814453125, 27.55029296875, 28.415771484375, 29.28125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 37.0, 343.0, 505.0, 113.0, 17.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.22747802734375, -23.57173728942871, -21.915996551513672, -20.260257720947266, -18.604516983032227, -16.948776245117188, -15.293035507202148, -13.637295722961426, -11.981554985046387, -10.325814247131348, -8.670074462890625, -7.014333724975586, -5.358593463897705, -3.702853202819824, -2.047112464904785, -0.3913726806640625, 1.2643680572509766, 2.9201083183288574, 4.575848579406738, 6.231589317321777, 7.887329578399658, 9.543069839477539, 11.198810577392578, 12.8545503616333, 14.51029109954834, 16.166030883789062, 17.8217716217041, 19.47751235961914, 21.13325309753418, 22.78899383544922, 24.444732666015625, 26.100473403930664, 27.756214141845703, 29.411954879760742, 31.06769561767578, 32.72343444824219, 34.37917709350586, 36.034915924072266, 37.69065856933594, 39.346397399902344, 41.00213623046875, 42.657875061035156, 44.31361770629883, 45.969356536865234, 47.625099182128906, 49.28083801269531, 50.93657684326172, 52.59231948852539, 54.24806213378906, 55.90380096435547, 57.55954360961914, 59.21528244018555, 60.87102508544922, 62.526763916015625, 64.18250274658203, 65.83824157714844, 67.49398040771484, 69.14971923828125, 70.80545806884766, 72.4612045288086, 74.116943359375, 75.7726821899414, 77.42842102050781, 79.08415985107422, 80.73990631103516]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 6.0, 3.0, 4.0, 5.0, 7.0, 6.0, 9.0, 15.0, 9.0, 10.0, 17.0, 21.0, 17.0, 22.0, 27.0, 23.0, 32.0, 26.0, 31.0, 39.0, 36.0, 36.0, 36.0, 34.0, 42.0, 31.0, 46.0, 38.0, 32.0, 35.0, 35.0, 31.0, 34.0, 23.0, 16.0, 29.0, 18.0, 19.0, 15.0, 17.0, 16.0, 15.0, 12.0, 4.0, 10.0, 3.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-44.937191009521484, -43.51692581176758, -42.09666442871094, -40.67639923095703, -39.256134033203125, -37.835872650146484, -36.41560745239258, -34.99534606933594, -33.57508087158203, -32.154815673828125, -30.734554290771484, -29.314289093017578, -27.894025802612305, -26.47376251220703, -25.053497314453125, -23.63323402404785, -22.212970733642578, -20.792707443237305, -19.37244415283203, -17.952178955078125, -16.53191566467285, -15.111652374267578, -13.691388130187988, -12.271123886108398, -10.850860595703125, -9.430597305297852, -8.010333061218262, -6.59006929397583, -5.169805526733398, -3.749541759490967, -2.329277992248535, -0.9090137481689453, 0.5112533569335938, 1.9315171241760254, 3.351780891418457, 4.772044658660889, 6.19230842590332, 7.612572193145752, 9.032835960388184, 10.453100204467773, 11.873363494873047, 13.29362678527832, 14.71389102935791, 16.1341552734375, 17.554418563842773, 18.974681854248047, 20.394947052001953, 21.815210342407227, 23.2354736328125, 24.655736923217773, 26.076000213623047, 27.496265411376953, 28.916528701782227, 30.3367919921875, 31.757057189941406, 33.17732238769531, 34.59758377075195, 36.01784896850586, 37.4381103515625, 38.858375549316406, 40.27864074707031, 41.69890213012695, 43.11916732788086, 44.5394287109375, 45.959693908691406]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 3.0, 7.0, 2.0, 11.0, 9.0, 9.0, 13.0, 12.0, 20.0, 23.0, 16.0, 29.0, 19.0, 26.0, 32.0, 31.0, 33.0, 39.0, 31.0, 42.0, 39.0, 42.0, 41.0, 44.0, 44.0, 32.0, 31.0, 36.0, 40.0, 29.0, 23.0, 21.0, 21.0, 28.0, 24.0, 17.0, 14.0, 8.0, 19.0, 5.0, 8.0, 5.0, 5.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.421875, -4.2882080078125, -4.154541015625, -4.0208740234375, -3.88720703125, -3.7535400390625, -3.619873046875, -3.4862060546875, -3.3525390625, -3.2188720703125, -3.085205078125, -2.9515380859375, -2.81787109375, -2.6842041015625, -2.550537109375, -2.4168701171875, -2.283203125, -2.1495361328125, -2.015869140625, -1.8822021484375, -1.74853515625, -1.6148681640625, -1.481201171875, -1.3475341796875, -1.2138671875, -1.0802001953125, -0.946533203125, -0.8128662109375, -0.67919921875, -0.5455322265625, -0.411865234375, -0.2781982421875, -0.14453125, -0.0108642578125, 0.122802734375, 0.2564697265625, 0.39013671875, 0.5238037109375, 0.657470703125, 0.7911376953125, 0.9248046875, 1.0584716796875, 1.192138671875, 1.3258056640625, 1.45947265625, 1.5931396484375, 1.726806640625, 1.8604736328125, 1.994140625, 2.1278076171875, 2.261474609375, 2.3951416015625, 2.52880859375, 2.6624755859375, 2.796142578125, 2.9298095703125, 3.0634765625, 3.1971435546875, 3.330810546875, 3.4644775390625, 3.59814453125, 3.7318115234375, 3.865478515625, 3.9991455078125, 4.1328125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 9.0, 9.0, 8.0, 9.0, 17.0, 26.0, 30.0, 38.0, 62.0, 100.0, 164.0, 341.0, 679.0, 1995.0, 7549.0, 40139.0, 339063.0, 2208415.0, 1410659.0, 155357.0, 22214.0, 4690.0, 1476.0, 537.0, 255.0, 143.0, 102.0, 46.0, 34.0, 24.0, 22.0, 17.0, 13.0, 8.0, 9.0, 5.0, 4.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.796875, -10.468017578125, -10.13916015625, -9.810302734375, -9.4814453125, -9.152587890625, -8.82373046875, -8.494873046875, -8.166015625, -7.837158203125, -7.50830078125, -7.179443359375, -6.8505859375, -6.521728515625, -6.19287109375, -5.864013671875, -5.53515625, -5.206298828125, -4.87744140625, -4.548583984375, -4.2197265625, -3.890869140625, -3.56201171875, -3.233154296875, -2.904296875, -2.575439453125, -2.24658203125, -1.917724609375, -1.5888671875, -1.260009765625, -0.93115234375, -0.602294921875, -0.2734375, 0.055419921875, 0.38427734375, 0.713134765625, 1.0419921875, 1.370849609375, 1.69970703125, 2.028564453125, 2.357421875, 2.686279296875, 3.01513671875, 3.343994140625, 3.6728515625, 4.001708984375, 4.33056640625, 4.659423828125, 4.98828125, 5.317138671875, 5.64599609375, 5.974853515625, 6.3037109375, 6.632568359375, 6.96142578125, 7.290283203125, 7.619140625, 7.947998046875, 8.27685546875, 8.605712890625, 8.9345703125, 9.263427734375, 9.59228515625, 9.921142578125, 10.25]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 5.0, 6.0, 7.0, 8.0, 21.0, 27.0, 31.0, 23.0, 45.0, 53.0, 80.0, 107.0, 130.0, 182.0, 211.0, 269.0, 317.0, 359.0, 370.0, 364.0, 299.0, 262.0, 206.0, 153.0, 118.0, 82.0, 69.0, 72.0, 48.0, 35.0, 27.0, 25.0, 18.0, 8.0, 6.0, 7.0, 5.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-11.8046875, -11.4886474609375, -11.172607421875, -10.8565673828125, -10.54052734375, -10.2244873046875, -9.908447265625, -9.5924072265625, -9.2763671875, -8.9603271484375, -8.644287109375, -8.3282470703125, -8.01220703125, -7.6961669921875, -7.380126953125, -7.0640869140625, -6.748046875, -6.4320068359375, -6.115966796875, -5.7999267578125, -5.48388671875, -5.1678466796875, -4.851806640625, -4.5357666015625, -4.2197265625, -3.9036865234375, -3.587646484375, -3.2716064453125, -2.95556640625, -2.6395263671875, -2.323486328125, -2.0074462890625, -1.69140625, -1.3753662109375, -1.059326171875, -0.7432861328125, -0.42724609375, -0.1112060546875, 0.204833984375, 0.5208740234375, 0.8369140625, 1.1529541015625, 1.468994140625, 1.7850341796875, 2.10107421875, 2.4171142578125, 2.733154296875, 3.0491943359375, 3.365234375, 3.6812744140625, 3.997314453125, 4.3133544921875, 4.62939453125, 4.9454345703125, 5.261474609375, 5.5775146484375, 5.8935546875, 6.2095947265625, 6.525634765625, 6.8416748046875, 7.15771484375, 7.4737548828125, 7.789794921875, 8.1058349609375, 8.421875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 14.0, 7.0, 14.0, 12.0, 31.0, 42.0, 64.0, 66.0, 130.0, 168.0, 330.0, 1039.0, 9665.0, 764386.0, 3383043.0, 32424.0, 1812.0, 419.0, 195.0, 125.0, 80.0, 52.0, 36.0, 39.0, 20.0, 16.0, 12.0, 9.0, 5.0, 5.0, 9.0, 1.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.0, -34.62451171875, -33.2490234375, -31.87353515625, -30.498046875, -29.12255859375, -27.7470703125, -26.37158203125, -24.99609375, -23.62060546875, -22.2451171875, -20.86962890625, -19.494140625, -18.11865234375, -16.7431640625, -15.36767578125, -13.9921875, -12.61669921875, -11.2412109375, -9.86572265625, -8.490234375, -7.11474609375, -5.7392578125, -4.36376953125, -2.98828125, -1.61279296875, -0.2373046875, 1.13818359375, 2.513671875, 3.88916015625, 5.2646484375, 6.64013671875, 8.015625, 9.39111328125, 10.7666015625, 12.14208984375, 13.517578125, 14.89306640625, 16.2685546875, 17.64404296875, 19.01953125, 20.39501953125, 21.7705078125, 23.14599609375, 24.521484375, 25.89697265625, 27.2724609375, 28.64794921875, 30.0234375, 31.39892578125, 32.7744140625, 34.14990234375, 35.525390625, 36.90087890625, 38.2763671875, 39.65185546875, 41.02734375, 42.40283203125, 43.7783203125, 45.15380859375, 46.529296875, 47.90478515625, 49.2802734375, 50.65576171875, 52.03125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 28.0, 146.0, 265.0, 308.0, 201.0, 52.0, 8.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-165.12496948242188, -160.6858367919922, -156.24668884277344, -151.80755615234375, -147.36842346191406, -142.9292755126953, -138.49014282226562, -134.05101013183594, -129.6118621826172, -125.17272186279297, -120.73358917236328, -116.29444885253906, -111.85530853271484, -107.41616821289062, -102.97703552246094, -98.53789520263672, -94.09876251220703, -89.65962219238281, -85.22048950195312, -80.7813491821289, -76.34220886230469, -71.903076171875, -67.46393585205078, -63.02479553222656, -58.58565902709961, -54.146522521972656, -49.70738220214844, -45.268245697021484, -40.82910919189453, -36.38996887207031, -31.95083236694336, -27.511693954467773, -23.072547912597656, -18.63340950012207, -14.1942720413208, -9.755134582519531, -5.315996170043945, -0.8768577575683594, 3.5622787475585938, 8.00141716003418, 12.440555572509766, 16.87969398498535, 21.318832397460938, 25.75796890258789, 30.197107315063477, 34.63624572753906, 39.075382232666016, 43.51451873779297, 47.95365905761719, 52.39279556274414, 56.83193588256836, 61.27107238769531, 65.71021270751953, 70.14935302734375, 74.58848571777344, 79.02762603759766, 83.46676635742188, 87.9059066772461, 92.34503936767578, 96.7841796875, 101.22332000732422, 105.66246032714844, 110.10159301757812, 114.54073333740234, 118.97986602783203]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 6.0, 4.0, 10.0, 4.0, 19.0, 10.0, 11.0, 11.0, 26.0, 20.0, 21.0, 23.0, 32.0, 31.0, 38.0, 42.0, 44.0, 40.0, 38.0, 39.0, 43.0, 34.0, 39.0, 34.0, 49.0, 38.0, 23.0, 31.0, 31.0, 28.0, 24.0, 25.0, 21.0, 19.0, 9.0, 10.0, 15.0, 14.0, 10.0, 7.0, 4.0, 8.0, 8.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-38.221527099609375, -37.04113006591797, -35.86073684692383, -34.68033981323242, -33.499942779541016, -32.319549560546875, -31.13915252685547, -29.958755493164062, -28.77836036682129, -27.597965240478516, -26.41756820678711, -25.237173080444336, -24.056777954101562, -22.876380920410156, -21.695985794067383, -20.51559066772461, -19.335193634033203, -18.15479850769043, -16.974401473999023, -15.79400634765625, -14.61361026763916, -13.43321418762207, -12.252819061279297, -11.072422981262207, -9.892026901245117, -8.711630821228027, -7.531235218048096, -6.350839614868164, -5.170443534851074, -3.9900474548339844, -2.8096518516540527, -1.629256248474121, -0.44886016845703125, 0.7315356731414795, 1.9119315147399902, 3.092327356338501, 4.272723197937012, 5.453119277954102, 6.633514881134033, 7.813910484313965, 8.994306564331055, 10.174702644348145, 11.355098724365234, 12.535493850708008, 13.715889930725098, 14.896286010742188, 16.07668113708496, 17.257076263427734, 18.43747329711914, 19.617868423461914, 20.79826545715332, 21.978660583496094, 23.1590576171875, 24.339452743530273, 25.519847869873047, 26.700244903564453, 27.880640029907227, 29.06103515625, 30.241432189941406, 31.42182731628418, 32.60222244262695, 33.78261947631836, 34.963016510009766, 36.143409729003906, 37.32380676269531]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 3.0, 7.0, 9.0, 4.0, 11.0, 8.0, 16.0, 12.0, 15.0, 18.0, 22.0, 23.0, 36.0, 24.0, 28.0, 46.0, 40.0, 33.0, 32.0, 42.0, 58.0, 43.0, 41.0, 34.0, 44.0, 37.0, 29.0, 29.0, 30.0, 26.0, 24.0, 23.0, 22.0, 20.0, 22.0, 11.0, 10.0, 10.0, 10.0, 8.0, 12.0, 13.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.640625, -4.5008544921875, -4.361083984375, -4.2213134765625, -4.08154296875, -3.9417724609375, -3.802001953125, -3.6622314453125, -3.5224609375, -3.3826904296875, -3.242919921875, -3.1031494140625, -2.96337890625, -2.8236083984375, -2.683837890625, -2.5440673828125, -2.404296875, -2.2645263671875, -2.124755859375, -1.9849853515625, -1.84521484375, -1.7054443359375, -1.565673828125, -1.4259033203125, -1.2861328125, -1.1463623046875, -1.006591796875, -0.8668212890625, -0.72705078125, -0.5872802734375, -0.447509765625, -0.3077392578125, -0.16796875, -0.0281982421875, 0.111572265625, 0.2513427734375, 0.39111328125, 0.5308837890625, 0.670654296875, 0.8104248046875, 0.9501953125, 1.0899658203125, 1.229736328125, 1.3695068359375, 1.50927734375, 1.6490478515625, 1.788818359375, 1.9285888671875, 2.068359375, 2.2081298828125, 2.347900390625, 2.4876708984375, 2.62744140625, 2.7672119140625, 2.906982421875, 3.0467529296875, 3.1865234375, 3.3262939453125, 3.466064453125, 3.6058349609375, 3.74560546875, 3.8853759765625, 4.025146484375, 4.1649169921875, 4.3046875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 6.0, 9.0, 14.0, 18.0, 21.0, 20.0, 26.0, 65.0, 89.0, 106.0, 186.0, 247.0, 326.0, 452.0, 722.0, 1016.0, 1524.0, 2158.0, 3312.0, 4830.0, 7255.0, 10757.0, 16251.0, 25004.0, 38871.0, 59949.0, 97544.0, 154076.0, 197315.0, 154851.0, 97840.0, 60066.0, 38912.0, 24992.0, 16407.0, 10901.0, 7199.0, 4749.0, 3292.0, 2218.0, 1525.0, 1083.0, 713.0, 530.0, 345.0, 238.0, 169.0, 105.0, 80.0, 56.0, 43.0, 31.0, 20.0, 8.0, 9.0, 7.0, 7.0, 1.0, 3.0, 2.0], "bins": [-0.53515625, -0.5186920166015625, -0.502227783203125, -0.4857635498046875, -0.46929931640625, -0.4528350830078125, -0.436370849609375, -0.4199066162109375, -0.4034423828125, -0.3869781494140625, -0.370513916015625, -0.3540496826171875, -0.33758544921875, -0.3211212158203125, -0.304656982421875, -0.2881927490234375, -0.271728515625, -0.2552642822265625, -0.238800048828125, -0.2223358154296875, -0.20587158203125, -0.1894073486328125, -0.172943115234375, -0.1564788818359375, -0.1400146484375, -0.1235504150390625, -0.107086181640625, -0.0906219482421875, -0.07415771484375, -0.0576934814453125, -0.041229248046875, -0.0247650146484375, -0.00830078125, 0.0081634521484375, 0.024627685546875, 0.0410919189453125, 0.05755615234375, 0.0740203857421875, 0.090484619140625, 0.1069488525390625, 0.1234130859375, 0.1398773193359375, 0.156341552734375, 0.1728057861328125, 0.18927001953125, 0.2057342529296875, 0.222198486328125, 0.2386627197265625, 0.255126953125, 0.2715911865234375, 0.288055419921875, 0.3045196533203125, 0.32098388671875, 0.3374481201171875, 0.353912353515625, 0.3703765869140625, 0.3868408203125, 0.4033050537109375, 0.419769287109375, 0.4362335205078125, 0.45269775390625, 0.4691619873046875, 0.485626220703125, 0.5020904541015625, 0.5185546875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 10.0, 9.0, 13.0, 19.0, 20.0, 26.0, 27.0, 21.0, 31.0, 35.0, 34.0, 37.0, 43.0, 42.0, 36.0, 46.0, 1071.0, 46.0, 41.0, 49.0, 32.0, 43.0, 37.0, 38.0, 32.0, 27.0, 23.0, 24.0, 16.0, 13.0, 14.0, 10.0, 16.0, 7.0, 9.0, 5.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.15234375, -3.04937744140625, -2.9464111328125, -2.84344482421875, -2.740478515625, -2.63751220703125, -2.5345458984375, -2.43157958984375, -2.32861328125, -2.22564697265625, -2.1226806640625, -2.01971435546875, -1.916748046875, -1.81378173828125, -1.7108154296875, -1.60784912109375, -1.5048828125, -1.40191650390625, -1.2989501953125, -1.19598388671875, -1.093017578125, -0.99005126953125, -0.8870849609375, -0.78411865234375, -0.68115234375, -0.57818603515625, -0.4752197265625, -0.37225341796875, -0.269287109375, -0.16632080078125, -0.0633544921875, 0.03961181640625, 0.142578125, 0.24554443359375, 0.3485107421875, 0.45147705078125, 0.554443359375, 0.65740966796875, 0.7603759765625, 0.86334228515625, 0.96630859375, 1.06927490234375, 1.1722412109375, 1.27520751953125, 1.378173828125, 1.48114013671875, 1.5841064453125, 1.68707275390625, 1.7900390625, 1.89300537109375, 1.9959716796875, 2.09893798828125, 2.201904296875, 2.30487060546875, 2.4078369140625, 2.51080322265625, 2.61376953125, 2.71673583984375, 2.8197021484375, 2.92266845703125, 3.025634765625, 3.12860107421875, 3.2315673828125, 3.33453369140625, 3.4375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 8.0, 10.0, 19.0, 33.0, 31.0, 55.0, 67.0, 104.0, 189.0, 309.0, 446.0, 724.0, 1190.0, 1944.0, 3050.0, 4738.0, 7861.0, 12707.0, 21206.0, 36084.0, 64420.0, 118822.0, 204805.0, 1278342.0, 148982.0, 80959.0, 44492.0, 25725.0, 15113.0, 9330.0, 5682.0, 3624.0, 2266.0, 1422.0, 840.0, 559.0, 348.0, 216.0, 150.0, 99.0, 53.0, 34.0, 26.0, 20.0, 3.0, 13.0, 6.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.587890625, -0.5701751708984375, -0.552459716796875, -0.5347442626953125, -0.51702880859375, -0.4993133544921875, -0.481597900390625, -0.4638824462890625, -0.4461669921875, -0.4284515380859375, -0.410736083984375, -0.3930206298828125, -0.37530517578125, -0.3575897216796875, -0.339874267578125, -0.3221588134765625, -0.304443359375, -0.2867279052734375, -0.269012451171875, -0.2512969970703125, -0.23358154296875, -0.2158660888671875, -0.198150634765625, -0.1804351806640625, -0.1627197265625, -0.1450042724609375, -0.127288818359375, -0.1095733642578125, -0.09185791015625, -0.0741424560546875, -0.056427001953125, -0.0387115478515625, -0.02099609375, -0.0032806396484375, 0.014434814453125, 0.0321502685546875, 0.04986572265625, 0.0675811767578125, 0.085296630859375, 0.1030120849609375, 0.1207275390625, 0.1384429931640625, 0.156158447265625, 0.1738739013671875, 0.19158935546875, 0.2093048095703125, 0.227020263671875, 0.2447357177734375, 0.262451171875, 0.2801666259765625, 0.297882080078125, 0.3155975341796875, 0.33331298828125, 0.3510284423828125, 0.368743896484375, 0.3864593505859375, 0.4041748046875, 0.4218902587890625, 0.439605712890625, 0.4573211669921875, 0.47503662109375, 0.4927520751953125, 0.510467529296875, 0.5281829833984375, 0.5458984375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 4.0, 0.0, 6.0, 4.0, 7.0, 13.0, 11.0, 15.0, 16.0, 20.0, 23.0, 34.0, 41.0, 33.0, 46.0, 64.0, 51.0, 52.0, 57.0, 45.0, 55.0, 47.0, 41.0, 39.0, 45.0, 40.0, 44.0, 29.0, 19.0, 18.0, 17.0, 18.0, 11.0, 11.0, 4.0, 2.0, 5.0, 3.0, 6.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014047622680664062, -0.0013611167669296265, -0.0013174712657928467, -0.001273825764656067, -0.0012301802635192871, -0.0011865347623825073, -0.0011428892612457275, -0.0010992437601089478, -0.001055598258972168, -0.0010119527578353882, -0.0009683072566986084, -0.0009246617555618286, -0.0008810162544250488, -0.000837370753288269, -0.0007937252521514893, -0.0007500797510147095, -0.0007064342498779297, -0.0006627887487411499, -0.0006191432476043701, -0.0005754977464675903, -0.0005318522453308105, -0.00048820674419403076, -0.000444561243057251, -0.0004009157419204712, -0.0003572702407836914, -0.0003136247396469116, -0.00026997923851013184, -0.00022633373737335205, -0.00018268823623657227, -0.00013904273509979248, -9.53972339630127e-05, -5.175173282623291e-05, -8.106231689453125e-06, 3.553926944732666e-05, 7.918477058410645e-05, 0.00012283027172088623, 0.00016647577285766602, 0.0002101212739944458, 0.0002537667751312256, 0.00029741227626800537, 0.00034105777740478516, 0.00038470327854156494, 0.0004283487796783447, 0.0004719942808151245, 0.0005156397819519043, 0.0005592852830886841, 0.0006029307842254639, 0.0006465762853622437, 0.0006902217864990234, 0.0007338672876358032, 0.000777512788772583, 0.0008211582899093628, 0.0008648037910461426, 0.0009084492921829224, 0.0009520947933197021, 0.000995740294456482, 0.0010393857955932617, 0.0010830312967300415, 0.0011266767978668213, 0.001170322299003601, 0.0012139678001403809, 0.0012576133012771606, 0.0013012588024139404, 0.0013449043035507202, 0.0013885498046875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 9.0, 8.0, 9.0, 16.0, 28.0, 14.0, 24.0, 23.0, 35.0, 48.0, 84.0, 110.0, 150.0, 243.0, 456.0, 1153.0, 827433.0, 216680.0, 878.0, 399.0, 244.0, 131.0, 84.0, 62.0, 49.0, 43.0, 20.0, 20.0, 11.0, 18.0, 12.0, 14.0, 9.0, 5.0, 2.0, 1.0, 5.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0302276611328125, -0.02928018569946289, -0.02833271026611328, -0.027385234832763672, -0.026437759399414062, -0.025490283966064453, -0.024542808532714844, -0.023595333099365234, -0.022647857666015625, -0.021700382232666016, -0.020752906799316406, -0.019805431365966797, -0.018857955932617188, -0.017910480499267578, -0.01696300506591797, -0.01601552963256836, -0.01506805419921875, -0.01412057876586914, -0.013173103332519531, -0.012225627899169922, -0.011278152465820312, -0.010330677032470703, -0.009383201599121094, -0.008435726165771484, -0.007488250732421875, -0.006540775299072266, -0.005593299865722656, -0.004645824432373047, -0.0036983489990234375, -0.002750873565673828, -0.0018033981323242188, -0.0008559226989746094, 9.1552734375e-05, 0.0010390281677246094, 0.0019865036010742188, 0.002933979034423828, 0.0038814544677734375, 0.004828929901123047, 0.005776405334472656, 0.006723880767822266, 0.007671356201171875, 0.008618831634521484, 0.009566307067871094, 0.010513782501220703, 0.011461257934570312, 0.012408733367919922, 0.013356208801269531, 0.01430368423461914, 0.01525115966796875, 0.01619863510131836, 0.01714611053466797, 0.018093585968017578, 0.019041061401367188, 0.019988536834716797, 0.020936012268066406, 0.021883487701416016, 0.022830963134765625, 0.023778438568115234, 0.024725914001464844, 0.025673389434814453, 0.026620864868164062, 0.027568340301513672, 0.02851581573486328, 0.02946329116821289, 0.0304107666015625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 121.0, 815.0, 79.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.01166532188653946, -0.011465760879218578, -0.011266199871897697, -0.011066637933254242, -0.010867076925933361, -0.01066751591861248, -0.0104679549112916, -0.010268393903970718, -0.010068831965327263, -0.009869270958006382, -0.009669709950685501, -0.009470148012042046, -0.009270587004721165, -0.009071025997400284, -0.008871464990079403, -0.008671903982758522, -0.008472342975437641, -0.00827278196811676, -0.00807322096079588, -0.007873659022152424, -0.007674098014831543, -0.007474537007510662, -0.007274976000189781, -0.0070754149928689, -0.006875853519886732, -0.006676292512565851, -0.006476731039583683, -0.006277170032262802, -0.006077609024941921, -0.005878047551959753, -0.005678486544638872, -0.005478925071656704, -0.005279363598674536, -0.005079802591353655, -0.004880241118371487, -0.004680680111050606, -0.004481119103729725, -0.004281557630747557, -0.004081996623426676, -0.0038824353832751513, -0.0036828741431236267, -0.003483312902972102, -0.0032837516628205776, -0.0030841906554996967, -0.002884629415348172, -0.0026850681751966476, -0.0024855071678757668, -0.002285945927724242, -0.0020863846875727177, -0.0018868234474211931, -0.0016872623236849904, -0.0014877011999487877, -0.0012881399597972631, -0.0010885787196457386, -0.0008890175959095359, -0.0006894564721733332, -0.0004898953484371305, -0.0002903341664932668, -9.077298454940319e-05, 0.00010878819739446044, 0.00030834937933832407, 0.0005079106194898486, 0.0007074717432260513, 0.000907032866962254, 0.0011065941071137786]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 7.0, 9.0, 8.0, 6.0, 7.0, 12.0, 8.0, 12.0, 13.0, 17.0, 19.0, 17.0, 24.0, 21.0, 29.0, 39.0, 37.0, 32.0, 25.0, 42.0, 39.0, 52.0, 25.0, 37.0, 36.0, 36.0, 42.0, 25.0, 37.0, 32.0, 30.0, 36.0, 24.0, 17.0, 18.0, 20.0, 16.0, 12.0, 14.0, 15.0, 15.0, 9.0, 8.0, 9.0, 7.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.000741422176361084, -0.0007203370332717896, -0.0006992518901824951, -0.0006781667470932007, -0.0006570816040039062, -0.0006359964609146118, -0.0006149113178253174, -0.000593826174736023, -0.0005727410316467285, -0.0005516558885574341, -0.0005305707454681396, -0.0005094856023788452, -0.0004884004592895508, -0.00046731531620025635, -0.0004462301731109619, -0.0004251450300216675, -0.00040405988693237305, -0.0003829747438430786, -0.0003618896007537842, -0.00034080445766448975, -0.0003197193145751953, -0.0002986341714859009, -0.00027754902839660645, -0.000256463885307312, -0.00023537874221801758, -0.00021429359912872314, -0.0001932084560394287, -0.00017212331295013428, -0.00015103816986083984, -0.0001299530267715454, -0.00010886788368225098, -8.778274059295654e-05, -6.669759750366211e-05, -4.5612454414367676e-05, -2.4527311325073242e-05, -3.4421682357788086e-06, 1.7642974853515625e-05, 3.872811794281006e-05, 5.981326103210449e-05, 8.089840412139893e-05, 0.00010198354721069336, 0.0001230686902999878, 0.00014415383338928223, 0.00016523897647857666, 0.0001863241195678711, 0.00020740926265716553, 0.00022849440574645996, 0.0002495795488357544, 0.00027066469192504883, 0.00029174983501434326, 0.0003128349781036377, 0.00033392012119293213, 0.00035500526428222656, 0.000376090407371521, 0.00039717555046081543, 0.00041826069355010986, 0.0004393458366394043, 0.00046043097972869873, 0.00048151612281799316, 0.0005026012659072876, 0.000523686408996582, 0.0005447715520858765, 0.0005658566951751709, 0.0005869418382644653, 0.0006080269813537598]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 3.0, 7.0, 9.0, 4.0, 11.0, 8.0, 16.0, 12.0, 15.0, 18.0, 22.0, 23.0, 35.0, 25.0, 28.0, 46.0, 40.0, 33.0, 32.0, 42.0, 58.0, 43.0, 41.0, 34.0, 44.0, 37.0, 29.0, 28.0, 31.0, 26.0, 24.0, 23.0, 22.0, 20.0, 22.0, 11.0, 10.0, 10.0, 10.0, 8.0, 12.0, 13.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.640625, -4.5008544921875, -4.361083984375, -4.2213134765625, -4.08154296875, -3.9417724609375, -3.802001953125, -3.6622314453125, -3.5224609375, -3.3826904296875, -3.242919921875, -3.1031494140625, -2.96337890625, -2.8236083984375, -2.683837890625, -2.5440673828125, -2.404296875, -2.2645263671875, -2.124755859375, -1.9849853515625, -1.84521484375, -1.7054443359375, -1.565673828125, -1.4259033203125, -1.2861328125, -1.1463623046875, -1.006591796875, -0.8668212890625, -0.72705078125, -0.5872802734375, -0.447509765625, -0.3077392578125, -0.16796875, -0.0281982421875, 0.111572265625, 0.2513427734375, 0.39111328125, 0.5308837890625, 0.670654296875, 0.8104248046875, 0.9501953125, 1.0899658203125, 1.229736328125, 1.3695068359375, 1.50927734375, 1.6490478515625, 1.788818359375, 1.9285888671875, 2.068359375, 2.2081298828125, 2.347900390625, 2.4876708984375, 2.62744140625, 2.7672119140625, 2.906982421875, 3.0467529296875, 3.1865234375, 3.3262939453125, 3.466064453125, 3.6058349609375, 3.74560546875, 3.8853759765625, 4.025146484375, 4.1649169921875, 4.3046875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 4.0, 3.0, 5.0, 6.0, 4.0, 9.0, 8.0, 15.0, 18.0, 23.0, 18.0, 50.0, 73.0, 119.0, 221.0, 414.0, 825.0, 1629.0, 3108.0, 6584.0, 14372.0, 34755.0, 97012.0, 295210.0, 380444.0, 133272.0, 46261.0, 18146.0, 7997.0, 3816.0, 1931.0, 976.0, 532.0, 281.0, 131.0, 96.0, 54.0, 35.0, 18.0, 19.0, 10.0, 9.0, 16.0, 4.0, 10.0, 9.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.919921875, -2.831817626953125, -2.74371337890625, -2.655609130859375, -2.5675048828125, -2.479400634765625, -2.39129638671875, -2.303192138671875, -2.215087890625, -2.126983642578125, -2.03887939453125, -1.950775146484375, -1.8626708984375, -1.774566650390625, -1.68646240234375, -1.598358154296875, -1.51025390625, -1.422149658203125, -1.33404541015625, -1.245941162109375, -1.1578369140625, -1.069732666015625, -0.98162841796875, -0.893524169921875, -0.805419921875, -0.717315673828125, -0.62921142578125, -0.541107177734375, -0.4530029296875, -0.364898681640625, -0.27679443359375, -0.188690185546875, -0.1005859375, -0.012481689453125, 0.07562255859375, 0.163726806640625, 0.2518310546875, 0.339935302734375, 0.42803955078125, 0.516143798828125, 0.604248046875, 0.692352294921875, 0.78045654296875, 0.868560791015625, 0.9566650390625, 1.044769287109375, 1.13287353515625, 1.220977783203125, 1.30908203125, 1.397186279296875, 1.48529052734375, 1.573394775390625, 1.6614990234375, 1.749603271484375, 1.83770751953125, 1.925811767578125, 2.013916015625, 2.102020263671875, 2.19012451171875, 2.278228759765625, 2.3663330078125, 2.454437255859375, 2.54254150390625, 2.630645751953125, 2.71875]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 2.0, 5.0, 6.0, 4.0, 6.0, 2.0, 9.0, 15.0, 14.0, 25.0, 24.0, 16.0, 22.0, 28.0, 35.0, 45.0, 47.0, 46.0, 60.0, 92.0, 210.0, 1701.0, 160.0, 82.0, 37.0, 45.0, 40.0, 38.0, 32.0, 34.0, 24.0, 22.0, 28.0, 18.0, 19.0, 12.0, 11.0, 9.0, 6.0, 6.0, 7.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.921875, -16.364990234375, -15.80810546875, -15.251220703125, -14.6943359375, -14.137451171875, -13.58056640625, -13.023681640625, -12.466796875, -11.909912109375, -11.35302734375, -10.796142578125, -10.2392578125, -9.682373046875, -9.12548828125, -8.568603515625, -8.01171875, -7.454833984375, -6.89794921875, -6.341064453125, -5.7841796875, -5.227294921875, -4.67041015625, -4.113525390625, -3.556640625, -2.999755859375, -2.44287109375, -1.885986328125, -1.3291015625, -0.772216796875, -0.21533203125, 0.341552734375, 0.8984375, 1.455322265625, 2.01220703125, 2.569091796875, 3.1259765625, 3.682861328125, 4.23974609375, 4.796630859375, 5.353515625, 5.910400390625, 6.46728515625, 7.024169921875, 7.5810546875, 8.137939453125, 8.69482421875, 9.251708984375, 9.80859375, 10.365478515625, 10.92236328125, 11.479248046875, 12.0361328125, 12.593017578125, 13.14990234375, 13.706787109375, 14.263671875, 14.820556640625, 15.37744140625, 15.934326171875, 16.4912109375, 17.048095703125, 17.60498046875, 18.161865234375, 18.71875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 10.0, 7.0, 8.0, 10.0, 12.0, 15.0, 18.0, 29.0, 30.0, 30.0, 52.0, 40.0, 92.0, 133.0, 202.0, 351.0, 904.0, 5116.0, 2566620.0, 566707.0, 3555.0, 807.0, 330.0, 194.0, 106.0, 73.0, 65.0, 32.0, 24.0, 25.0, 28.0, 22.0, 15.0, 7.0, 4.0, 5.0, 6.0, 3.0, 7.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.8125, -29.876708984375, -28.94091796875, -28.005126953125, -27.0693359375, -26.133544921875, -25.19775390625, -24.261962890625, -23.326171875, -22.390380859375, -21.45458984375, -20.518798828125, -19.5830078125, -18.647216796875, -17.71142578125, -16.775634765625, -15.83984375, -14.904052734375, -13.96826171875, -13.032470703125, -12.0966796875, -11.160888671875, -10.22509765625, -9.289306640625, -8.353515625, -7.417724609375, -6.48193359375, -5.546142578125, -4.6103515625, -3.674560546875, -2.73876953125, -1.802978515625, -0.8671875, 0.068603515625, 1.00439453125, 1.940185546875, 2.8759765625, 3.811767578125, 4.74755859375, 5.683349609375, 6.619140625, 7.554931640625, 8.49072265625, 9.426513671875, 10.3623046875, 11.298095703125, 12.23388671875, 13.169677734375, 14.10546875, 15.041259765625, 15.97705078125, 16.912841796875, 17.8486328125, 18.784423828125, 19.72021484375, 20.656005859375, 21.591796875, 22.527587890625, 23.46337890625, 24.399169921875, 25.3349609375, 26.270751953125, 27.20654296875, 28.142333984375, 29.078125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [6.0, 39.0, 165.0, 440.0, 270.0, 85.0, 8.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.939155101776123, -4.361083507537842, -2.7830116748809814, -1.204939842224121, 0.37313175201416016, 1.9512033462524414, 3.529275417327881, 5.107347011566162, 6.685418605804443, 8.263490676879883, 9.841562271118164, 11.419633865356445, 12.997705459594727, 14.575777053833008, 16.15384864807129, 17.73192024230957, 19.30999183654785, 20.888063430786133, 22.466135025024414, 24.044206619262695, 25.622278213500977, 27.200349807739258, 28.778423309326172, 30.356494903564453, 31.934566497802734, 33.512638092041016, 35.0907096862793, 36.66878128051758, 38.24685287475586, 39.82492446899414, 41.40299606323242, 42.9810676574707, 44.559139251708984, 46.137210845947266, 47.71528244018555, 49.29335403442383, 50.87142562866211, 52.44949722290039, 54.02756881713867, 55.60564041137695, 57.183712005615234, 58.761783599853516, 60.3398551940918, 61.91792678833008, 63.49599838256836, 65.0740737915039, 66.65214538574219, 68.23021697998047, 69.80828857421875, 71.38636016845703, 72.96443176269531, 74.5425033569336, 76.12057495117188, 77.69864654541016, 79.27671813964844, 80.85478973388672, 82.432861328125, 84.01093292236328, 85.58900451660156, 87.16707611083984, 88.74514770507812, 90.3232192993164, 91.90129089355469, 93.47936248779297, 95.05743408203125]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 5.0, 6.0, 5.0, 8.0, 10.0, 12.0, 20.0, 25.0, 23.0, 24.0, 31.0, 27.0, 25.0, 35.0, 37.0, 41.0, 48.0, 43.0, 36.0, 39.0, 45.0, 51.0, 41.0, 42.0, 38.0, 38.0, 38.0, 24.0, 27.0, 17.0, 21.0, 24.0, 14.0, 16.0, 14.0, 14.0, 11.0, 3.0, 7.0, 5.0, 3.0, 2.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.34609603881836, -48.606353759765625, -46.866615295410156, -45.12687301635742, -43.38713073730469, -41.64738845825195, -39.90764617919922, -38.16790771484375, -36.428165435791016, -34.68842315673828, -32.94868469238281, -31.208942413330078, -29.469200134277344, -27.72945785522461, -25.989717483520508, -24.249977111816406, -22.510234832763672, -20.770492553710938, -19.030752182006836, -17.291011810302734, -15.55126953125, -13.811528205871582, -12.071786880493164, -10.332045555114746, -8.592304229736328, -6.85256290435791, -5.112821578979492, -3.373080253601074, -1.6333389282226562, 0.10640239715576172, 1.8461437225341797, 3.5858850479125977, 5.32562255859375, 7.065363883972168, 8.805105209350586, 10.544846534729004, 12.284587860107422, 14.02432918548584, 15.764070510864258, 17.50381088256836, 19.243553161621094, 20.983295440673828, 22.72303581237793, 24.46277618408203, 26.202518463134766, 27.9422607421875, 29.6820011138916, 31.421741485595703, 33.16148376464844, 34.90122604370117, 36.640968322753906, 38.380706787109375, 40.12044906616211, 41.860191345214844, 43.59992980957031, 45.33967208862305, 47.07941436767578, 48.819156646728516, 50.55889892578125, 52.29863739013672, 54.03837966918945, 55.77812194824219, 57.517860412597656, 59.25760269165039, 60.997344970703125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 7.0, 5.0, 3.0, 6.0, 5.0, 9.0, 9.0, 10.0, 14.0, 18.0, 20.0, 20.0, 24.0, 22.0, 30.0, 28.0, 36.0, 49.0, 32.0, 33.0, 39.0, 44.0, 42.0, 41.0, 37.0, 39.0, 47.0, 38.0, 27.0, 20.0, 26.0, 32.0, 17.0, 25.0, 24.0, 25.0, 14.0, 9.0, 12.0, 11.0, 5.0, 15.0, 9.0, 7.0, 8.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.7109375, -4.5716552734375, -4.432373046875, -4.2930908203125, -4.15380859375, -4.0145263671875, -3.875244140625, -3.7359619140625, -3.5966796875, -3.4573974609375, -3.318115234375, -3.1788330078125, -3.03955078125, -2.9002685546875, -2.760986328125, -2.6217041015625, -2.482421875, -2.3431396484375, -2.203857421875, -2.0645751953125, -1.92529296875, -1.7860107421875, -1.646728515625, -1.5074462890625, -1.3681640625, -1.2288818359375, -1.089599609375, -0.9503173828125, -0.81103515625, -0.6717529296875, -0.532470703125, -0.3931884765625, -0.25390625, -0.1146240234375, 0.024658203125, 0.1639404296875, 0.30322265625, 0.4425048828125, 0.581787109375, 0.7210693359375, 0.8603515625, 0.9996337890625, 1.138916015625, 1.2781982421875, 1.41748046875, 1.5567626953125, 1.696044921875, 1.8353271484375, 1.974609375, 2.1138916015625, 2.253173828125, 2.3924560546875, 2.53173828125, 2.6710205078125, 2.810302734375, 2.9495849609375, 3.0888671875, 3.2281494140625, 3.367431640625, 3.5067138671875, 3.64599609375, 3.7852783203125, 3.924560546875, 4.0638427734375, 4.203125]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 4.0, 2.0, 6.0, 10.0, 7.0, 6.0, 23.0, 7.0, 27.0, 20.0, 35.0, 32.0, 43.0, 54.0, 85.0, 158.0, 338.0, 869.0, 3288.0, 17966.0, 176590.0, 2157849.0, 1693946.0, 124673.0, 14020.0, 2642.0, 744.0, 309.0, 142.0, 80.0, 71.0, 48.0, 30.0, 22.0, 21.0, 22.0, 7.0, 7.0, 17.0, 13.0, 7.0, 7.0, 6.0, 9.0, 2.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-13.9375, -13.5267333984375, -13.115966796875, -12.7052001953125, -12.29443359375, -11.8836669921875, -11.472900390625, -11.0621337890625, -10.6513671875, -10.2406005859375, -9.829833984375, -9.4190673828125, -9.00830078125, -8.5975341796875, -8.186767578125, -7.7760009765625, -7.365234375, -6.9544677734375, -6.543701171875, -6.1329345703125, -5.72216796875, -5.3114013671875, -4.900634765625, -4.4898681640625, -4.0791015625, -3.6683349609375, -3.257568359375, -2.8468017578125, -2.43603515625, -2.0252685546875, -1.614501953125, -1.2037353515625, -0.79296875, -0.3822021484375, 0.028564453125, 0.4393310546875, 0.85009765625, 1.2608642578125, 1.671630859375, 2.0823974609375, 2.4931640625, 2.9039306640625, 3.314697265625, 3.7254638671875, 4.13623046875, 4.5469970703125, 4.957763671875, 5.3685302734375, 5.779296875, 6.1900634765625, 6.600830078125, 7.0115966796875, 7.42236328125, 7.8331298828125, 8.243896484375, 8.6546630859375, 9.0654296875, 9.4761962890625, 9.886962890625, 10.2977294921875, 10.70849609375, 11.1192626953125, 11.530029296875, 11.9407958984375, 12.3515625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 3.0, 4.0, 3.0, 5.0, 11.0, 11.0, 16.0, 12.0, 29.0, 34.0, 35.0, 26.0, 71.0, 76.0, 99.0, 122.0, 155.0, 201.0, 229.0, 269.0, 295.0, 328.0, 346.0, 298.0, 266.0, 205.0, 207.0, 145.0, 113.0, 105.0, 80.0, 62.0, 36.0, 42.0, 34.0, 26.0, 14.0, 12.0, 18.0, 10.0, 3.0, 5.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.0234375, -9.73583984375, -9.4482421875, -9.16064453125, -8.873046875, -8.58544921875, -8.2978515625, -8.01025390625, -7.72265625, -7.43505859375, -7.1474609375, -6.85986328125, -6.572265625, -6.28466796875, -5.9970703125, -5.70947265625, -5.421875, -5.13427734375, -4.8466796875, -4.55908203125, -4.271484375, -3.98388671875, -3.6962890625, -3.40869140625, -3.12109375, -2.83349609375, -2.5458984375, -2.25830078125, -1.970703125, -1.68310546875, -1.3955078125, -1.10791015625, -0.8203125, -0.53271484375, -0.2451171875, 0.04248046875, 0.330078125, 0.61767578125, 0.9052734375, 1.19287109375, 1.48046875, 1.76806640625, 2.0556640625, 2.34326171875, 2.630859375, 2.91845703125, 3.2060546875, 3.49365234375, 3.78125, 4.06884765625, 4.3564453125, 4.64404296875, 4.931640625, 5.21923828125, 5.5068359375, 5.79443359375, 6.08203125, 6.36962890625, 6.6572265625, 6.94482421875, 7.232421875, 7.52001953125, 7.8076171875, 8.09521484375, 8.3828125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 6.0, 8.0, 10.0, 8.0, 17.0, 18.0, 41.0, 68.0, 48.0, 99.0, 158.0, 208.0, 356.0, 1049.0, 10362.0, 816026.0, 3328461.0, 34276.0, 1835.0, 447.0, 249.0, 165.0, 111.0, 68.0, 59.0, 39.0, 28.0, 13.0, 17.0, 8.0, 9.0, 5.0, 9.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.84375, -34.5244140625, -33.205078125, -31.8857421875, -30.56640625, -29.2470703125, -27.927734375, -26.6083984375, -25.2890625, -23.9697265625, -22.650390625, -21.3310546875, -20.01171875, -18.6923828125, -17.373046875, -16.0537109375, -14.734375, -13.4150390625, -12.095703125, -10.7763671875, -9.45703125, -8.1376953125, -6.818359375, -5.4990234375, -4.1796875, -2.8603515625, -1.541015625, -0.2216796875, 1.09765625, 2.4169921875, 3.736328125, 5.0556640625, 6.375, 7.6943359375, 9.013671875, 10.3330078125, 11.65234375, 12.9716796875, 14.291015625, 15.6103515625, 16.9296875, 18.2490234375, 19.568359375, 20.8876953125, 22.20703125, 23.5263671875, 24.845703125, 26.1650390625, 27.484375, 28.8037109375, 30.123046875, 31.4423828125, 32.76171875, 34.0810546875, 35.400390625, 36.7197265625, 38.0390625, 39.3583984375, 40.677734375, 41.9970703125, 43.31640625, 44.6357421875, 45.955078125, 47.2744140625, 48.59375]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 12.0, 41.0, 120.0, 231.0, 240.0, 206.0, 103.0, 42.0, 13.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.62589263916016, -101.90959930419922, -98.19331359863281, -94.47702026367188, -90.76072692871094, -87.04444122314453, -83.3281478881836, -79.61186218261719, -75.89556884765625, -72.17927551269531, -68.4629898071289, -64.74669647216797, -61.0304069519043, -57.314117431640625, -53.59782409667969, -49.881534576416016, -46.165245056152344, -42.44895553588867, -38.732666015625, -35.01637268066406, -31.30008316040039, -27.58379364013672, -23.867502212524414, -20.15121078491211, -16.434921264648438, -12.71863079071045, -9.002340316772461, -5.286049842834473, -1.5697593688964844, 2.1465301513671875, 5.862821578979492, 9.579113006591797, 13.295394897460938, 17.01168441772461, 20.727975845336914, 24.44426727294922, 28.16055679321289, 31.876846313476562, 35.5931396484375, 39.30942916870117, 43.025718688964844, 46.742008209228516, 50.45829772949219, 54.174591064453125, 57.8908805847168, 61.60717010498047, 65.3234634399414, 69.03974914550781, 72.75604248046875, 76.47233581542969, 80.1886215209961, 83.90491485595703, 87.62120056152344, 91.33749389648438, 95.05378723144531, 98.77008056640625, 102.48636627197266, 106.2026596069336, 109.9189453125, 113.63523864746094, 117.35153198242188, 121.06781768798828, 124.78411102294922, 128.50039672851562, 132.21669006347656]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 4.0, 5.0, 7.0, 13.0, 8.0, 7.0, 9.0, 11.0, 9.0, 17.0, 15.0, 21.0, 16.0, 27.0, 29.0, 31.0, 27.0, 36.0, 36.0, 35.0, 33.0, 36.0, 33.0, 33.0, 65.0, 45.0, 45.0, 39.0, 28.0, 31.0, 28.0, 30.0, 32.0, 30.0, 23.0, 22.0, 18.0, 16.0, 16.0, 7.0, 8.0, 7.0, 4.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-40.88726806640625, -39.69952392578125, -38.51177978515625, -37.324031829833984, -36.136287689208984, -34.948543548583984, -33.760799407958984, -32.573055267333984, -31.38530921936035, -30.19756507873535, -29.00981903076172, -27.82207489013672, -26.63433074951172, -25.446584701538086, -24.258840560913086, -23.071094512939453, -21.883350372314453, -20.695606231689453, -19.50786018371582, -18.32011604309082, -17.132369995117188, -15.944625854492188, -14.756881713867188, -13.569136619567871, -12.381391525268555, -11.193646430969238, -10.005901336669922, -8.818157196044922, -7.6304121017456055, -6.442667007446289, -5.254922389984131, -4.067177772521973, -2.8794326782226562, -1.691687822341919, -0.5039429664611816, 0.6838018894195557, 1.871546745300293, 3.0592918395996094, 4.247036457061768, 5.434781074523926, 6.622526168823242, 7.810271263122559, 8.998016357421875, 10.185760498046875, 11.373505592346191, 12.561250686645508, 13.748994827270508, 14.936739921569824, 16.12448501586914, 17.31222915649414, 18.499975204467773, 19.687719345092773, 20.875465393066406, 22.063209533691406, 23.250953674316406, 24.438697814941406, 25.62644386291504, 26.81418800354004, 28.001934051513672, 29.189678192138672, 30.377422332763672, 31.565168380737305, 32.75291442871094, 33.94065856933594, 35.12840270996094]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 6.0, 3.0, 11.0, 4.0, 7.0, 13.0, 6.0, 24.0, 15.0, 22.0, 24.0, 28.0, 36.0, 37.0, 36.0, 26.0, 44.0, 38.0, 42.0, 37.0, 41.0, 44.0, 44.0, 35.0, 47.0, 48.0, 22.0, 32.0, 28.0, 22.0, 20.0, 25.0, 17.0, 11.0, 23.0, 12.0, 10.0, 13.0, 8.0, 8.0, 9.0, 6.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.84375, -4.69500732421875, -4.5462646484375, -4.39752197265625, -4.248779296875, -4.10003662109375, -3.9512939453125, -3.80255126953125, -3.65380859375, -3.50506591796875, -3.3563232421875, -3.20758056640625, -3.058837890625, -2.91009521484375, -2.7613525390625, -2.61260986328125, -2.4638671875, -2.31512451171875, -2.1663818359375, -2.01763916015625, -1.868896484375, -1.72015380859375, -1.5714111328125, -1.42266845703125, -1.27392578125, -1.12518310546875, -0.9764404296875, -0.82769775390625, -0.678955078125, -0.53021240234375, -0.3814697265625, -0.23272705078125, -0.083984375, 0.06475830078125, 0.2135009765625, 0.36224365234375, 0.510986328125, 0.65972900390625, 0.8084716796875, 0.95721435546875, 1.10595703125, 1.25469970703125, 1.4034423828125, 1.55218505859375, 1.700927734375, 1.84967041015625, 1.9984130859375, 2.14715576171875, 2.2958984375, 2.44464111328125, 2.5933837890625, 2.74212646484375, 2.890869140625, 3.03961181640625, 3.1883544921875, 3.33709716796875, 3.48583984375, 3.63458251953125, 3.7833251953125, 3.93206787109375, 4.080810546875, 4.22955322265625, 4.3782958984375, 4.52703857421875, 4.67578125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 9.0, 19.0, 25.0, 38.0, 65.0, 72.0, 110.0, 183.0, 280.0, 392.0, 624.0, 940.0, 1435.0, 2248.0, 3267.0, 5049.0, 7856.0, 11987.0, 18912.0, 30894.0, 51417.0, 88539.0, 151990.0, 217346.0, 180610.0, 109456.0, 63199.0, 37554.0, 22791.0, 14554.0, 9280.0, 5975.0, 4019.0, 2507.0, 1644.0, 1128.0, 732.0, 461.0, 316.0, 226.0, 125.0, 125.0, 53.0, 32.0, 32.0, 18.0, 10.0, 9.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.59814453125, -0.5798492431640625, -0.561553955078125, -0.5432586669921875, -0.52496337890625, -0.5066680908203125, -0.488372802734375, -0.4700775146484375, -0.4517822265625, -0.4334869384765625, -0.415191650390625, -0.3968963623046875, -0.37860107421875, -0.3603057861328125, -0.342010498046875, -0.3237152099609375, -0.305419921875, -0.2871246337890625, -0.268829345703125, -0.2505340576171875, -0.23223876953125, -0.2139434814453125, -0.195648193359375, -0.1773529052734375, -0.1590576171875, -0.1407623291015625, -0.122467041015625, -0.1041717529296875, -0.08587646484375, -0.0675811767578125, -0.049285888671875, -0.0309906005859375, -0.0126953125, 0.0055999755859375, 0.023895263671875, 0.0421905517578125, 0.06048583984375, 0.0787811279296875, 0.097076416015625, 0.1153717041015625, 0.1336669921875, 0.1519622802734375, 0.170257568359375, 0.1885528564453125, 0.20684814453125, 0.2251434326171875, 0.243438720703125, 0.2617340087890625, 0.280029296875, 0.2983245849609375, 0.316619873046875, 0.3349151611328125, 0.35321044921875, 0.3715057373046875, 0.389801025390625, 0.4080963134765625, 0.4263916015625, 0.4446868896484375, 0.462982177734375, 0.4812774658203125, 0.49957275390625, 0.5178680419921875, 0.536163330078125, 0.5544586181640625, 0.57275390625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 5.0, 2.0, 10.0, 12.0, 15.0, 16.0, 24.0, 11.0, 18.0, 20.0, 27.0, 22.0, 29.0, 20.0, 33.0, 33.0, 35.0, 45.0, 36.0, 41.0, 1071.0, 48.0, 31.0, 37.0, 44.0, 35.0, 26.0, 29.0, 33.0, 26.0, 20.0, 23.0, 28.0, 21.0, 22.0, 13.0, 11.0, 12.0, 6.0, 10.0, 2.0, 5.0, 6.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.8046875, -2.7138671875, -2.623046875, -2.5322265625, -2.44140625, -2.3505859375, -2.259765625, -2.1689453125, -2.078125, -1.9873046875, -1.896484375, -1.8056640625, -1.71484375, -1.6240234375, -1.533203125, -1.4423828125, -1.3515625, -1.2607421875, -1.169921875, -1.0791015625, -0.98828125, -0.8974609375, -0.806640625, -0.7158203125, -0.625, -0.5341796875, -0.443359375, -0.3525390625, -0.26171875, -0.1708984375, -0.080078125, 0.0107421875, 0.1015625, 0.1923828125, 0.283203125, 0.3740234375, 0.46484375, 0.5556640625, 0.646484375, 0.7373046875, 0.828125, 0.9189453125, 1.009765625, 1.1005859375, 1.19140625, 1.2822265625, 1.373046875, 1.4638671875, 1.5546875, 1.6455078125, 1.736328125, 1.8271484375, 1.91796875, 2.0087890625, 2.099609375, 2.1904296875, 2.28125, 2.3720703125, 2.462890625, 2.5537109375, 2.64453125, 2.7353515625, 2.826171875, 2.9169921875, 3.0078125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 9.0, 10.0, 18.0, 13.0, 48.0, 50.0, 94.0, 106.0, 168.0, 304.0, 469.0, 686.0, 1123.0, 1656.0, 2774.0, 4838.0, 8208.0, 14888.0, 27846.0, 52514.0, 104304.0, 198725.0, 1309728.0, 175951.0, 90552.0, 45995.0, 24332.0, 13320.0, 7334.0, 4363.0, 2527.0, 1530.0, 943.0, 607.0, 375.0, 237.0, 172.0, 96.0, 84.0, 35.0, 33.0, 17.0, 11.0, 17.0, 9.0, 8.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0], "bins": [-0.6904296875, -0.6703567504882812, -0.6502838134765625, -0.6302108764648438, -0.610137939453125, -0.5900650024414062, -0.5699920654296875, -0.5499191284179688, -0.52984619140625, -0.5097732543945312, -0.4897003173828125, -0.46962738037109375, -0.449554443359375, -0.42948150634765625, -0.4094085693359375, -0.38933563232421875, -0.3692626953125, -0.34918975830078125, -0.3291168212890625, -0.30904388427734375, -0.288970947265625, -0.26889801025390625, -0.2488250732421875, -0.22875213623046875, -0.20867919921875, -0.18860626220703125, -0.1685333251953125, -0.14846038818359375, -0.128387451171875, -0.10831451416015625, -0.0882415771484375, -0.06816864013671875, -0.048095703125, -0.02802276611328125, -0.0079498291015625, 0.01212310791015625, 0.032196044921875, 0.05226898193359375, 0.0723419189453125, 0.09241485595703125, 0.11248779296875, 0.13256072998046875, 0.1526336669921875, 0.17270660400390625, 0.192779541015625, 0.21285247802734375, 0.2329254150390625, 0.25299835205078125, 0.2730712890625, 0.29314422607421875, 0.3132171630859375, 0.33329010009765625, 0.353363037109375, 0.37343597412109375, 0.3935089111328125, 0.41358184814453125, 0.43365478515625, 0.45372772216796875, 0.4738006591796875, 0.49387359619140625, 0.513946533203125, 0.5340194702148438, 0.5540924072265625, 0.5741653442382812, 0.59423828125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 5.0, 8.0, 5.0, 17.0, 9.0, 25.0, 32.0, 21.0, 35.0, 43.0, 36.0, 47.0, 72.0, 64.0, 61.0, 78.0, 66.0, 72.0, 50.0, 39.0, 38.0, 30.0, 29.0, 21.0, 25.0, 16.0, 13.0, 13.0, 7.0, 5.0, 6.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014171600341796875, -0.001368105411529541, -0.0013190507888793945, -0.001269996166229248, -0.0012209415435791016, -0.001171886920928955, -0.0011228322982788086, -0.0010737776756286621, -0.0010247230529785156, -0.0009756684303283691, -0.0009266138076782227, -0.0008775591850280762, -0.0008285045623779297, -0.0007794499397277832, -0.0007303953170776367, -0.0006813406944274902, -0.0006322860717773438, -0.0005832314491271973, -0.0005341768264770508, -0.0004851222038269043, -0.0004360675811767578, -0.00038701295852661133, -0.00033795833587646484, -0.00028890371322631836, -0.00023984909057617188, -0.0001907944679260254, -0.0001417398452758789, -9.268522262573242e-05, -4.363059997558594e-05, 5.424022674560547e-06, 5.447864532470703e-05, 0.00010353326797485352, 0.000152587890625, 0.00020164251327514648, 0.00025069713592529297, 0.00029975175857543945, 0.00034880638122558594, 0.0003978610038757324, 0.0004469156265258789, 0.0004959702491760254, 0.0005450248718261719, 0.0005940794944763184, 0.0006431341171264648, 0.0006921887397766113, 0.0007412433624267578, 0.0007902979850769043, 0.0008393526077270508, 0.0008884072303771973, 0.0009374618530273438, 0.0009865164756774902, 0.0010355710983276367, 0.0010846257209777832, 0.0011336803436279297, 0.0011827349662780762, 0.0012317895889282227, 0.0012808442115783691, 0.0013298988342285156, 0.0013789534568786621, 0.0014280080795288086, 0.001477062702178955, 0.0015261173248291016, 0.001575171947479248, 0.0016242265701293945, 0.001673281192779541, 0.0017223358154296875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 9.0, 16.0, 10.0, 11.0, 17.0, 33.0, 48.0, 50.0, 79.0, 119.0, 195.0, 361.0, 768.0, 26490.0, 1017326.0, 1723.0, 523.0, 265.0, 160.0, 102.0, 74.0, 41.0, 35.0, 20.0, 15.0, 17.0, 8.0, 6.0, 8.0, 6.0, 4.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.038421630859375, -0.03736257553100586, -0.03630352020263672, -0.03524446487426758, -0.03418540954589844, -0.0331263542175293, -0.032067298889160156, -0.031008243560791016, -0.029949188232421875, -0.028890132904052734, -0.027831077575683594, -0.026772022247314453, -0.025712966918945312, -0.024653911590576172, -0.02359485626220703, -0.02253580093383789, -0.02147674560546875, -0.02041769027709961, -0.01935863494873047, -0.018299579620361328, -0.017240524291992188, -0.016181468963623047, -0.015122413635253906, -0.014063358306884766, -0.013004302978515625, -0.011945247650146484, -0.010886192321777344, -0.009827136993408203, -0.008768081665039062, -0.007709026336669922, -0.006649971008300781, -0.005590915679931641, -0.0045318603515625, -0.0034728050231933594, -0.0024137496948242188, -0.0013546943664550781, -0.0002956390380859375, 0.0007634162902832031, 0.0018224716186523438, 0.0028815269470214844, 0.003940582275390625, 0.004999637603759766, 0.006058692932128906, 0.007117748260498047, 0.008176803588867188, 0.009235858917236328, 0.010294914245605469, 0.01135396957397461, 0.01241302490234375, 0.01347208023071289, 0.014531135559082031, 0.015590190887451172, 0.016649246215820312, 0.017708301544189453, 0.018767356872558594, 0.019826412200927734, 0.020885467529296875, 0.021944522857666016, 0.023003578186035156, 0.024062633514404297, 0.025121688842773438, 0.026180744171142578, 0.02723979949951172, 0.02829885482788086, 0.02935791015625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 13.0, 183.0, 553.0, 247.0, 20.0, 1.0, 0.0, 1.0], "bins": [-0.00814589112997055, -0.008006857708096504, -0.007867824286222458, -0.007728790398687124, -0.007589756511151791, -0.007450723089277744, -0.007311689201742411, -0.007172655779868364, -0.007033621892333031, -0.006894588470458984, -0.006755554582923651, -0.006616521161049604, -0.006477487273514271, -0.0063384538516402245, -0.006199419964104891, -0.0060603865422308445, -0.005921352654695511, -0.0057823192328214645, -0.005643285345286131, -0.005504251923412085, -0.005365218035876751, -0.005226184614002705, -0.005087150726467371, -0.004948117304593325, -0.004809083882719278, -0.004670050460845232, -0.004531016573309898, -0.004391983151435852, -0.004252949263900518, -0.004113915842026472, -0.0039748819544911385, -0.003835848532617092, -0.003696815110743046, -0.003557781456038356, -0.003418747801333666, -0.003279714146628976, -0.003140680491924286, -0.003001646837219596, -0.002862613182514906, -0.0027235797606408596, -0.002584545873105526, -0.002445512218400836, -0.002306478563696146, -0.002167444908991456, -0.002028411254286766, -0.001889377599582076, -0.001750344061292708, -0.001611310406588018, -0.001472276751883328, -0.001333243097178638, -0.001194209442473948, -0.0010551759041845798, -0.000916142191272229, -0.000777108536567539, -0.0006380749400705099, -0.0004990412853658199, -0.00036000763066112995, -0.0002209739905083552, -8.194035035558045e-05, 5.7093275245279074e-05, 0.00019612692994996905, 0.00033516058465465903, 0.0004741941811516881, 0.0006132278358563781, 0.0007522614905610681]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 8.0, 3.0, 6.0, 8.0, 15.0, 11.0, 12.0, 22.0, 10.0, 20.0, 20.0, 35.0, 19.0, 35.0, 39.0, 33.0, 36.0, 45.0, 39.0, 43.0, 45.0, 38.0, 41.0, 43.0, 48.0, 39.0, 30.0, 37.0, 32.0, 32.0, 25.0, 24.0, 19.0, 24.0, 13.0, 14.0, 9.0, 10.0, 13.0, 5.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007391571998596191, -0.000714525580406189, -0.0006898939609527588, -0.0006652623414993286, -0.0006406307220458984, -0.0006159991025924683, -0.0005913674831390381, -0.0005667358636856079, -0.0005421042442321777, -0.0005174726247787476, -0.0004928410053253174, -0.0004682093858718872, -0.00044357776641845703, -0.00041894614696502686, -0.0003943145275115967, -0.0003696829080581665, -0.00034505128860473633, -0.00032041966915130615, -0.000295788049697876, -0.0002711564302444458, -0.0002465248107910156, -0.00022189319133758545, -0.00019726157188415527, -0.0001726299524307251, -0.00014799833297729492, -0.00012336671352386475, -9.873509407043457e-05, -7.41034746170044e-05, -4.947185516357422e-05, -2.4840235710144043e-05, -2.086162567138672e-07, 2.442300319671631e-05, 4.9054622650146484e-05, 7.368624210357666e-05, 9.831786155700684e-05, 0.000122949481010437, 0.0001475811004638672, 0.00017221271991729736, 0.00019684433937072754, 0.00022147595882415771, 0.0002461075782775879, 0.00027073919773101807, 0.00029537081718444824, 0.0003200024366378784, 0.0003446340560913086, 0.00036926567554473877, 0.00039389729499816895, 0.0004185289144515991, 0.0004431605339050293, 0.00046779215335845947, 0.0004924237728118896, 0.0005170553922653198, 0.00054168701171875, 0.0005663186311721802, 0.0005909502506256104, 0.0006155818700790405, 0.0006402134895324707, 0.0006648451089859009, 0.0006894767284393311, 0.0007141083478927612, 0.0007387399673461914, 0.0007633715867996216, 0.0007880032062530518, 0.0008126348257064819, 0.0008372664451599121]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 6.0, 3.0, 11.0, 4.0, 7.0, 13.0, 6.0, 24.0, 15.0, 22.0, 24.0, 28.0, 36.0, 37.0, 35.0, 27.0, 44.0, 38.0, 42.0, 37.0, 41.0, 44.0, 44.0, 35.0, 47.0, 48.0, 22.0, 32.0, 28.0, 22.0, 20.0, 25.0, 17.0, 11.0, 23.0, 12.0, 10.0, 13.0, 8.0, 8.0, 9.0, 6.0, 6.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.84375, -4.69500732421875, -4.5462646484375, -4.39752197265625, -4.248779296875, -4.10003662109375, -3.9512939453125, -3.80255126953125, -3.65380859375, -3.50506591796875, -3.3563232421875, -3.20758056640625, -3.058837890625, -2.91009521484375, -2.7613525390625, -2.61260986328125, -2.4638671875, -2.31512451171875, -2.1663818359375, -2.01763916015625, -1.868896484375, -1.72015380859375, -1.5714111328125, -1.42266845703125, -1.27392578125, -1.12518310546875, -0.9764404296875, -0.82769775390625, -0.678955078125, -0.53021240234375, -0.3814697265625, -0.23272705078125, -0.083984375, 0.06475830078125, 0.2135009765625, 0.36224365234375, 0.510986328125, 0.65972900390625, 0.8084716796875, 0.95721435546875, 1.10595703125, 1.25469970703125, 1.4034423828125, 1.55218505859375, 1.700927734375, 1.84967041015625, 1.9984130859375, 2.14715576171875, 2.2958984375, 2.44464111328125, 2.5933837890625, 2.74212646484375, 2.890869140625, 3.03961181640625, 3.1883544921875, 3.33709716796875, 3.48583984375, 3.63458251953125, 3.7833251953125, 3.93206787109375, 4.080810546875, 4.22955322265625, 4.3782958984375, 4.52703857421875, 4.67578125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 9.0, 11.0, 26.0, 25.0, 40.0, 57.0, 95.0, 149.0, 219.0, 363.0, 534.0, 851.0, 1359.0, 2311.0, 3654.0, 6212.0, 11470.0, 25431.0, 72721.0, 307773.0, 449352.0, 100646.0, 32904.0, 14226.0, 7337.0, 4025.0, 2505.0, 1534.0, 998.0, 590.0, 396.0, 229.0, 175.0, 102.0, 70.0, 43.0, 37.0, 24.0, 18.0, 13.0, 8.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.84765625, -4.70562744140625, -4.5635986328125, -4.42156982421875, -4.279541015625, -4.13751220703125, -3.9954833984375, -3.85345458984375, -3.71142578125, -3.56939697265625, -3.4273681640625, -3.28533935546875, -3.143310546875, -3.00128173828125, -2.8592529296875, -2.71722412109375, -2.5751953125, -2.43316650390625, -2.2911376953125, -2.14910888671875, -2.007080078125, -1.86505126953125, -1.7230224609375, -1.58099365234375, -1.43896484375, -1.29693603515625, -1.1549072265625, -1.01287841796875, -0.870849609375, -0.72882080078125, -0.5867919921875, -0.44476318359375, -0.302734375, -0.16070556640625, -0.0186767578125, 0.12335205078125, 0.265380859375, 0.40740966796875, 0.5494384765625, 0.69146728515625, 0.83349609375, 0.97552490234375, 1.1175537109375, 1.25958251953125, 1.401611328125, 1.54364013671875, 1.6856689453125, 1.82769775390625, 1.9697265625, 2.11175537109375, 2.2537841796875, 2.39581298828125, 2.537841796875, 2.67987060546875, 2.8218994140625, 2.96392822265625, 3.10595703125, 3.24798583984375, 3.3900146484375, 3.53204345703125, 3.674072265625, 3.81610107421875, 3.9581298828125, 4.10015869140625, 4.2421875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 2.0, 6.0, 11.0, 9.0, 9.0, 15.0, 10.0, 14.0, 11.0, 14.0, 23.0, 19.0, 29.0, 19.0, 33.0, 35.0, 33.0, 43.0, 49.0, 69.0, 103.0, 385.0, 1540.0, 128.0, 66.0, 32.0, 38.0, 41.0, 22.0, 21.0, 40.0, 29.0, 17.0, 18.0, 20.0, 19.0, 18.0, 9.0, 9.0, 5.0, 13.0, 2.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0], "bins": [-17.109375, -16.6217041015625, -16.134033203125, -15.6463623046875, -15.15869140625, -14.6710205078125, -14.183349609375, -13.6956787109375, -13.2080078125, -12.7203369140625, -12.232666015625, -11.7449951171875, -11.25732421875, -10.7696533203125, -10.281982421875, -9.7943115234375, -9.306640625, -8.8189697265625, -8.331298828125, -7.8436279296875, -7.35595703125, -6.8682861328125, -6.380615234375, -5.8929443359375, -5.4052734375, -4.9176025390625, -4.429931640625, -3.9422607421875, -3.45458984375, -2.9669189453125, -2.479248046875, -1.9915771484375, -1.50390625, -1.0162353515625, -0.528564453125, -0.0408935546875, 0.44677734375, 0.9344482421875, 1.422119140625, 1.9097900390625, 2.3974609375, 2.8851318359375, 3.372802734375, 3.8604736328125, 4.34814453125, 4.8358154296875, 5.323486328125, 5.8111572265625, 6.298828125, 6.7864990234375, 7.274169921875, 7.7618408203125, 8.24951171875, 8.7371826171875, 9.224853515625, 9.7125244140625, 10.2001953125, 10.6878662109375, 11.175537109375, 11.6632080078125, 12.15087890625, 12.6385498046875, 13.126220703125, 13.6138916015625, 14.1015625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 7.0, 3.0, 3.0, 6.0, 6.0, 8.0, 13.0, 15.0, 28.0, 29.0, 43.0, 62.0, 84.0, 117.0, 219.0, 413.0, 1382.0, 31754.0, 3094123.0, 15324.0, 1057.0, 380.0, 182.0, 131.0, 93.0, 53.0, 41.0, 37.0, 20.0, 23.0, 20.0, 12.0, 6.0, 8.0, 5.0, 6.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.375, -46.07421875, -44.7734375, -43.47265625, -42.171875, -40.87109375, -39.5703125, -38.26953125, -36.96875, -35.66796875, -34.3671875, -33.06640625, -31.765625, -30.46484375, -29.1640625, -27.86328125, -26.5625, -25.26171875, -23.9609375, -22.66015625, -21.359375, -20.05859375, -18.7578125, -17.45703125, -16.15625, -14.85546875, -13.5546875, -12.25390625, -10.953125, -9.65234375, -8.3515625, -7.05078125, -5.75, -4.44921875, -3.1484375, -1.84765625, -0.546875, 0.75390625, 2.0546875, 3.35546875, 4.65625, 5.95703125, 7.2578125, 8.55859375, 9.859375, 11.16015625, 12.4609375, 13.76171875, 15.0625, 16.36328125, 17.6640625, 18.96484375, 20.265625, 21.56640625, 22.8671875, 24.16796875, 25.46875, 26.76953125, 28.0703125, 29.37109375, 30.671875, 31.97265625, 33.2734375, 34.57421875, 35.875]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 8.0, 20.0, 31.0, 59.0, 89.0, 123.0, 174.0, 162.0, 148.0, 81.0, 45.0, 36.0, 15.0, 13.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-32.12801742553711, -31.427978515625, -30.72793960571289, -30.02790069580078, -29.32785987854004, -28.62782096862793, -27.92778205871582, -27.22774314880371, -26.5277042388916, -25.827665328979492, -25.127626419067383, -24.42758560180664, -23.72754669189453, -23.027507781982422, -22.327468872070312, -21.627429962158203, -20.927391052246094, -20.227352142333984, -19.527313232421875, -18.827274322509766, -18.127233505249023, -17.427194595336914, -16.727155685424805, -16.027116775512695, -15.327075958251953, -14.627037048339844, -13.926997184753418, -13.226958274841309, -12.5269193649292, -11.826879501342773, -11.126840591430664, -10.426801681518555, -9.726763725280762, -9.026724815368652, -8.326684951782227, -7.626646041870117, -6.926607131958008, -6.22656774520874, -5.526528358459473, -4.826489448547363, -4.126450061798096, -3.4264109134674072, -2.7263717651367188, -2.026332378387451, -1.3262932300567627, -0.6262540817260742, 0.07378530502319336, 0.7738242149353027, 1.4738636016845703, 2.173902750015259, 2.8739418983459473, 3.573981285095215, 4.274020195007324, 4.974059581756592, 5.674098968505859, 6.374137878417969, 7.074177265167236, 7.774216651916504, 8.474255561828613, 9.174295425415039, 9.874334335327148, 10.574373245239258, 11.274412155151367, 11.974451065063477, 12.674490928649902]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 8.0, 4.0, 10.0, 15.0, 6.0, 13.0, 10.0, 21.0, 17.0, 19.0, 37.0, 22.0, 35.0, 42.0, 44.0, 41.0, 44.0, 48.0, 43.0, 33.0, 39.0, 44.0, 55.0, 43.0, 26.0, 30.0, 31.0, 29.0, 30.0, 31.0, 18.0, 14.0, 19.0, 16.0, 13.0, 10.0, 4.0, 8.0, 10.0, 4.0, 5.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-52.263065338134766, -50.63752365112305, -49.01198196411133, -47.38644027709961, -45.76089859008789, -44.13535690307617, -42.50981903076172, -40.88427734375, -39.25873565673828, -37.63319396972656, -36.007652282714844, -34.382110595703125, -32.756568908691406, -31.131027221679688, -29.5054874420166, -27.879945755004883, -26.25440216064453, -24.628860473632812, -23.003318786621094, -21.377777099609375, -19.752235412597656, -18.126693725585938, -16.50115394592285, -14.875612258911133, -13.250070571899414, -11.624528884887695, -9.998987197875977, -8.373446464538574, -6.7479047775268555, -5.122363090515137, -3.4968223571777344, -1.8712806701660156, -0.2457427978515625, 1.3797986507415771, 3.005340099334717, 4.630881309509277, 6.256422996520996, 7.881964683532715, 9.507505416870117, 11.133047103881836, 12.758588790893555, 14.384130477905273, 16.009672164916992, 17.635211944580078, 19.260753631591797, 20.886295318603516, 22.511837005615234, 24.137378692626953, 25.762920379638672, 27.38846206665039, 29.01400375366211, 30.639545440673828, 32.26508712768555, 33.890628814697266, 35.51616668701172, 37.14170837402344, 38.767250061035156, 40.392791748046875, 42.018333435058594, 43.64387512207031, 45.26941680908203, 46.89495849609375, 48.52050018310547, 50.14604187011719, 51.771583557128906]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 2.0, 5.0, 8.0, 7.0, 8.0, 8.0, 8.0, 19.0, 14.0, 22.0, 25.0, 21.0, 29.0, 44.0, 31.0, 33.0, 43.0, 41.0, 39.0, 36.0, 48.0, 41.0, 26.0, 57.0, 47.0, 41.0, 29.0, 26.0, 31.0, 25.0, 23.0, 22.0, 26.0, 18.0, 16.0, 13.0, 7.0, 10.0, 15.0, 9.0, 9.0, 7.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.16015625, -5.00384521484375, -4.8475341796875, -4.69122314453125, -4.534912109375, -4.37860107421875, -4.2222900390625, -4.06597900390625, -3.90966796875, -3.75335693359375, -3.5970458984375, -3.44073486328125, -3.284423828125, -3.12811279296875, -2.9718017578125, -2.81549072265625, -2.6591796875, -2.50286865234375, -2.3465576171875, -2.19024658203125, -2.033935546875, -1.87762451171875, -1.7213134765625, -1.56500244140625, -1.40869140625, -1.25238037109375, -1.0960693359375, -0.93975830078125, -0.783447265625, -0.62713623046875, -0.4708251953125, -0.31451416015625, -0.158203125, -0.00189208984375, 0.1544189453125, 0.31072998046875, 0.467041015625, 0.62335205078125, 0.7796630859375, 0.93597412109375, 1.09228515625, 1.24859619140625, 1.4049072265625, 1.56121826171875, 1.717529296875, 1.87384033203125, 2.0301513671875, 2.18646240234375, 2.3427734375, 2.49908447265625, 2.6553955078125, 2.81170654296875, 2.968017578125, 3.12432861328125, 3.2806396484375, 3.43695068359375, 3.59326171875, 3.74957275390625, 3.9058837890625, 4.06219482421875, 4.218505859375, 4.37481689453125, 4.5311279296875, 4.68743896484375, 4.84375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 5.0, 2.0, 4.0, 3.0, 6.0, 12.0, 13.0, 17.0, 43.0, 45.0, 71.0, 133.0, 245.0, 471.0, 960.0, 2002.0, 4873.0, 13122.0, 38554.0, 145099.0, 618847.0, 1576368.0, 1270077.0, 385505.0, 95094.0, 26966.0, 9269.0, 3553.0, 1451.0, 670.0, 321.0, 183.0, 102.0, 68.0, 39.0, 32.0, 21.0, 10.0, 15.0, 10.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.921875, -6.7110595703125, -6.500244140625, -6.2894287109375, -6.07861328125, -5.8677978515625, -5.656982421875, -5.4461669921875, -5.2353515625, -5.0245361328125, -4.813720703125, -4.6029052734375, -4.39208984375, -4.1812744140625, -3.970458984375, -3.7596435546875, -3.548828125, -3.3380126953125, -3.127197265625, -2.9163818359375, -2.70556640625, -2.4947509765625, -2.283935546875, -2.0731201171875, -1.8623046875, -1.6514892578125, -1.440673828125, -1.2298583984375, -1.01904296875, -0.8082275390625, -0.597412109375, -0.3865966796875, -0.17578125, 0.0350341796875, 0.245849609375, 0.4566650390625, 0.66748046875, 0.8782958984375, 1.089111328125, 1.2999267578125, 1.5107421875, 1.7215576171875, 1.932373046875, 2.1431884765625, 2.35400390625, 2.5648193359375, 2.775634765625, 2.9864501953125, 3.197265625, 3.4080810546875, 3.618896484375, 3.8297119140625, 4.04052734375, 4.2513427734375, 4.462158203125, 4.6729736328125, 4.8837890625, 5.0946044921875, 5.305419921875, 5.5162353515625, 5.72705078125, 5.9378662109375, 6.148681640625, 6.3594970703125, 6.5703125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 6.0, 13.0, 11.0, 24.0, 17.0, 30.0, 24.0, 46.0, 71.0, 97.0, 148.0, 189.0, 243.0, 303.0, 390.0, 435.0, 449.0, 400.0, 289.0, 230.0, 195.0, 114.0, 98.0, 51.0, 57.0, 30.0, 36.0, 21.0, 14.0, 8.0, 12.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.3515625, -14.9674072265625, -14.583251953125, -14.1990966796875, -13.81494140625, -13.4307861328125, -13.046630859375, -12.6624755859375, -12.2783203125, -11.8941650390625, -11.510009765625, -11.1258544921875, -10.74169921875, -10.3575439453125, -9.973388671875, -9.5892333984375, -9.205078125, -8.8209228515625, -8.436767578125, -8.0526123046875, -7.66845703125, -7.2843017578125, -6.900146484375, -6.5159912109375, -6.1318359375, -5.7476806640625, -5.363525390625, -4.9793701171875, -4.59521484375, -4.2110595703125, -3.826904296875, -3.4427490234375, -3.05859375, -2.6744384765625, -2.290283203125, -1.9061279296875, -1.52197265625, -1.1378173828125, -0.753662109375, -0.3695068359375, 0.0146484375, 0.3988037109375, 0.782958984375, 1.1671142578125, 1.55126953125, 1.9354248046875, 2.319580078125, 2.7037353515625, 3.087890625, 3.4720458984375, 3.856201171875, 4.2403564453125, 4.62451171875, 5.0086669921875, 5.392822265625, 5.7769775390625, 6.1611328125, 6.5452880859375, 6.929443359375, 7.3135986328125, 7.69775390625, 8.0819091796875, 8.466064453125, 8.8502197265625, 9.234375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 2.0, 5.0, 7.0, 8.0, 10.0, 13.0, 23.0, 23.0, 36.0, 40.0, 58.0, 77.0, 87.0, 165.0, 259.0, 678.0, 3807.0, 120103.0, 3843109.0, 218990.0, 5147.0, 723.0, 315.0, 163.0, 106.0, 89.0, 49.0, 47.0, 30.0, 32.0, 28.0, 9.0, 13.0, 6.0, 4.0, 4.0, 8.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.59375, -37.3310546875, -36.068359375, -34.8056640625, -33.54296875, -32.2802734375, -31.017578125, -29.7548828125, -28.4921875, -27.2294921875, -25.966796875, -24.7041015625, -23.44140625, -22.1787109375, -20.916015625, -19.6533203125, -18.390625, -17.1279296875, -15.865234375, -14.6025390625, -13.33984375, -12.0771484375, -10.814453125, -9.5517578125, -8.2890625, -7.0263671875, -5.763671875, -4.5009765625, -3.23828125, -1.9755859375, -0.712890625, 0.5498046875, 1.8125, 3.0751953125, 4.337890625, 5.6005859375, 6.86328125, 8.1259765625, 9.388671875, 10.6513671875, 11.9140625, 13.1767578125, 14.439453125, 15.7021484375, 16.96484375, 18.2275390625, 19.490234375, 20.7529296875, 22.015625, 23.2783203125, 24.541015625, 25.8037109375, 27.06640625, 28.3291015625, 29.591796875, 30.8544921875, 32.1171875, 33.3798828125, 34.642578125, 35.9052734375, 37.16796875, 38.4306640625, 39.693359375, 40.9560546875, 42.21875]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 10.0, 38.0, 72.0, 159.0, 211.0, 211.0, 181.0, 79.0, 36.0, 12.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-170.3240966796875, -166.93434143066406, -163.54457092285156, -160.15481567382812, -156.7650604248047, -153.3752899169922, -149.98553466796875, -146.59576416015625, -143.2060089111328, -139.81625366210938, -136.42648315429688, -133.03672790527344, -129.64697265625, -126.2572021484375, -122.86744689941406, -119.4776840209961, -116.08792114257812, -112.69815826416016, -109.30840301513672, -105.91864013671875, -102.52887725830078, -99.13911437988281, -95.74935913085938, -92.3595962524414, -88.96984100341797, -85.580078125, -82.19032287597656, -78.8005599975586, -75.41079711914062, -72.02104187011719, -68.63127899169922, -65.24151611328125, -61.851749420166016, -58.46199035644531, -55.072227478027344, -51.68246841430664, -48.29270553588867, -44.90294647216797, -41.51318359375, -38.1234245300293, -34.733665466308594, -31.343904495239258, -27.954143524169922, -24.56438446044922, -21.17462158203125, -17.784862518310547, -14.395101547241211, -11.005340576171875, -7.615577697753906, -4.22581672668457, -0.8360562324523926, 2.553704261779785, 5.943465232849121, 9.33322525024414, 12.722986221313477, 16.112747192382812, 19.50250816345215, 22.892269134521484, 26.28203010559082, 29.671791076660156, 33.06155014038086, 36.45130920410156, 39.84107208251953, 43.2308349609375, 46.6205940246582]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 1.0, 3.0, 1.0, 5.0, 7.0, 6.0, 7.0, 8.0, 14.0, 12.0, 10.0, 10.0, 21.0, 27.0, 26.0, 17.0, 36.0, 33.0, 28.0, 27.0, 43.0, 50.0, 40.0, 42.0, 32.0, 42.0, 46.0, 40.0, 44.0, 40.0, 37.0, 34.0, 37.0, 23.0, 29.0, 21.0, 13.0, 16.0, 15.0, 13.0, 14.0, 4.0, 6.0, 8.0, 6.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.613853454589844, -34.32896423339844, -33.04407501220703, -31.759185791015625, -30.47429656982422, -29.189407348632812, -27.904516220092773, -26.619626998901367, -25.33473777770996, -24.049848556518555, -22.76495933532715, -21.480070114135742, -20.195178985595703, -18.910289764404297, -17.62540054321289, -16.340511322021484, -15.055622100830078, -13.770732879638672, -12.485843658447266, -11.200953483581543, -9.916064262390137, -8.63117504119873, -7.346285343170166, -6.061395645141602, -4.776506423950195, -3.49161696434021, -2.2067275047302246, -0.9218380451202393, 0.3630514144897461, 1.6479406356811523, 2.932830333709717, 4.217720031738281, 5.5026092529296875, 6.787498474121094, 8.0723876953125, 9.357277870178223, 10.642167091369629, 11.927056312561035, 13.211946487426758, 14.496835708618164, 15.78172492980957, 17.066614151000977, 18.351503372192383, 19.63639259338379, 20.921283721923828, 22.206172943115234, 23.49106216430664, 24.775951385498047, 26.060840606689453, 27.34572982788086, 28.630619049072266, 29.915508270263672, 31.200397491455078, 32.485286712646484, 33.77017593383789, 35.05506896972656, 36.33995819091797, 37.624847412109375, 38.90973663330078, 40.19462585449219, 41.479515075683594, 42.764404296875, 44.049293518066406, 45.33418273925781, 46.61907196044922]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 3.0, 5.0, 5.0, 6.0, 11.0, 7.0, 10.0, 10.0, 13.0, 22.0, 20.0, 22.0, 29.0, 29.0, 42.0, 30.0, 37.0, 36.0, 47.0, 27.0, 47.0, 37.0, 42.0, 35.0, 39.0, 27.0, 33.0, 41.0, 34.0, 28.0, 20.0, 25.0, 29.0, 22.0, 21.0, 12.0, 18.0, 5.0, 7.0, 15.0, 14.0, 5.0, 8.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.91015625, -4.76031494140625, -4.6104736328125, -4.46063232421875, -4.310791015625, -4.16094970703125, -4.0111083984375, -3.86126708984375, -3.71142578125, -3.56158447265625, -3.4117431640625, -3.26190185546875, -3.112060546875, -2.96221923828125, -2.8123779296875, -2.66253662109375, -2.5126953125, -2.36285400390625, -2.2130126953125, -2.06317138671875, -1.913330078125, -1.76348876953125, -1.6136474609375, -1.46380615234375, -1.31396484375, -1.16412353515625, -1.0142822265625, -0.86444091796875, -0.714599609375, -0.56475830078125, -0.4149169921875, -0.26507568359375, -0.115234375, 0.03460693359375, 0.1844482421875, 0.33428955078125, 0.484130859375, 0.63397216796875, 0.7838134765625, 0.93365478515625, 1.08349609375, 1.23333740234375, 1.3831787109375, 1.53302001953125, 1.682861328125, 1.83270263671875, 1.9825439453125, 2.13238525390625, 2.2822265625, 2.43206787109375, 2.5819091796875, 2.73175048828125, 2.881591796875, 3.03143310546875, 3.1812744140625, 3.33111572265625, 3.48095703125, 3.63079833984375, 3.7806396484375, 3.93048095703125, 4.080322265625, 4.23016357421875, 4.3800048828125, 4.52984619140625, 4.6796875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 3.0, 5.0, 2.0, 10.0, 8.0, 12.0, 23.0, 30.0, 46.0, 69.0, 85.0, 131.0, 212.0, 306.0, 449.0, 696.0, 1020.0, 1664.0, 2552.0, 4044.0, 6347.0, 10021.0, 15902.0, 26168.0, 45388.0, 79641.0, 144689.0, 232675.0, 202065.0, 115908.0, 63915.0, 35870.0, 21936.0, 13312.0, 8351.0, 5350.0, 3394.0, 2128.0, 1411.0, 874.0, 619.0, 391.0, 262.0, 174.0, 128.0, 92.0, 54.0, 41.0, 32.0, 17.0, 12.0, 9.0, 8.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.65380859375, -0.6332550048828125, -0.612701416015625, -0.5921478271484375, -0.57159423828125, -0.5510406494140625, -0.530487060546875, -0.5099334716796875, -0.4893798828125, -0.4688262939453125, -0.448272705078125, -0.4277191162109375, -0.40716552734375, -0.3866119384765625, -0.366058349609375, -0.3455047607421875, -0.324951171875, -0.3043975830078125, -0.283843994140625, -0.2632904052734375, -0.24273681640625, -0.2221832275390625, -0.201629638671875, -0.1810760498046875, -0.1605224609375, -0.1399688720703125, -0.119415283203125, -0.0988616943359375, -0.07830810546875, -0.0577545166015625, -0.037200927734375, -0.0166473388671875, 0.00390625, 0.0244598388671875, 0.045013427734375, 0.0655670166015625, 0.08612060546875, 0.1066741943359375, 0.127227783203125, 0.1477813720703125, 0.1683349609375, 0.1888885498046875, 0.209442138671875, 0.2299957275390625, 0.25054931640625, 0.2711029052734375, 0.291656494140625, 0.3122100830078125, 0.332763671875, 0.3533172607421875, 0.373870849609375, 0.3944244384765625, 0.41497802734375, 0.4355316162109375, 0.456085205078125, 0.4766387939453125, 0.4971923828125, 0.5177459716796875, 0.538299560546875, 0.5588531494140625, 0.57940673828125, 0.5999603271484375, 0.620513916015625, 0.6410675048828125, 0.66162109375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 2.0, 7.0, 7.0, 5.0, 13.0, 14.0, 18.0, 16.0, 20.0, 23.0, 23.0, 28.0, 39.0, 33.0, 48.0, 37.0, 43.0, 47.0, 49.0, 1065.0, 36.0, 39.0, 39.0, 44.0, 49.0, 43.0, 30.0, 27.0, 23.0, 34.0, 24.0, 23.0, 18.0, 9.0, 8.0, 11.0, 6.0, 4.0, 1.0, 4.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.556640625, -3.448760986328125, -3.34088134765625, -3.233001708984375, -3.1251220703125, -3.017242431640625, -2.90936279296875, -2.801483154296875, -2.693603515625, -2.585723876953125, -2.47784423828125, -2.369964599609375, -2.2620849609375, -2.154205322265625, -2.04632568359375, -1.938446044921875, -1.83056640625, -1.722686767578125, -1.61480712890625, -1.506927490234375, -1.3990478515625, -1.291168212890625, -1.18328857421875, -1.075408935546875, -0.967529296875, -0.859649658203125, -0.75177001953125, -0.643890380859375, -0.5360107421875, -0.428131103515625, -0.32025146484375, -0.212371826171875, -0.1044921875, 0.003387451171875, 0.11126708984375, 0.219146728515625, 0.3270263671875, 0.434906005859375, 0.54278564453125, 0.650665283203125, 0.758544921875, 0.866424560546875, 0.97430419921875, 1.082183837890625, 1.1900634765625, 1.297943115234375, 1.40582275390625, 1.513702392578125, 1.62158203125, 1.729461669921875, 1.83734130859375, 1.945220947265625, 2.0531005859375, 2.160980224609375, 2.26885986328125, 2.376739501953125, 2.484619140625, 2.592498779296875, 2.70037841796875, 2.808258056640625, 2.9161376953125, 3.024017333984375, 3.13189697265625, 3.239776611328125, 3.34765625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 13.0, 23.0, 22.0, 37.0, 37.0, 84.0, 136.0, 205.0, 278.0, 402.0, 679.0, 1054.0, 1681.0, 2792.0, 4728.0, 8064.0, 14166.0, 25675.0, 48062.0, 93858.0, 176564.0, 1301298.0, 193307.0, 104595.0, 53122.0, 28260.0, 15766.0, 8812.0, 5282.0, 3129.0, 1966.0, 1121.0, 660.0, 437.0, 264.0, 184.0, 139.0, 66.0, 62.0, 21.0, 27.0, 11.0, 14.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.62548828125, -0.6050338745117188, -0.5845794677734375, -0.5641250610351562, -0.543670654296875, -0.5232162475585938, -0.5027618408203125, -0.48230743408203125, -0.46185302734375, -0.44139862060546875, -0.4209442138671875, -0.40048980712890625, -0.380035400390625, -0.35958099365234375, -0.3391265869140625, -0.31867218017578125, -0.2982177734375, -0.27776336669921875, -0.2573089599609375, -0.23685455322265625, -0.216400146484375, -0.19594573974609375, -0.1754913330078125, -0.15503692626953125, -0.13458251953125, -0.11412811279296875, -0.0936737060546875, -0.07321929931640625, -0.052764892578125, -0.03231048583984375, -0.0118560791015625, 0.00859832763671875, 0.029052734375, 0.04950714111328125, 0.0699615478515625, 0.09041595458984375, 0.110870361328125, 0.13132476806640625, 0.1517791748046875, 0.17223358154296875, 0.19268798828125, 0.21314239501953125, 0.2335968017578125, 0.25405120849609375, 0.274505615234375, 0.29496002197265625, 0.3154144287109375, 0.33586883544921875, 0.3563232421875, 0.37677764892578125, 0.3972320556640625, 0.41768646240234375, 0.438140869140625, 0.45859527587890625, 0.4790496826171875, 0.49950408935546875, 0.51995849609375, 0.5404129028320312, 0.5608673095703125, 0.5813217163085938, 0.601776123046875, 0.6222305297851562, 0.6426849365234375, 0.6631393432617188, 0.68359375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 8.0, 9.0, 10.0, 10.0, 23.0, 17.0, 13.0, 16.0, 12.0, 29.0, 28.0, 33.0, 33.0, 38.0, 30.0, 31.0, 42.0, 43.0, 38.0, 29.0, 45.0, 43.0, 39.0, 33.0, 34.0, 40.0, 33.0, 37.0, 35.0, 25.0, 31.0, 21.0, 20.0, 11.0, 14.0, 14.0, 9.0, 8.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0009169578552246094, -0.0008850321173667908, -0.0008531063795089722, -0.0008211806416511536, -0.000789254903793335, -0.0007573291659355164, -0.0007254034280776978, -0.0006934776902198792, -0.0006615519523620605, -0.0006296262145042419, -0.0005977004766464233, -0.0005657747387886047, -0.0005338490009307861, -0.0005019232630729675, -0.0004699975252151489, -0.0004380717873573303, -0.0004061460494995117, -0.0003742203116416931, -0.0003422945737838745, -0.0003103688359260559, -0.0002784430980682373, -0.0002465173602104187, -0.0002145916223526001, -0.0001826658844947815, -0.0001507401466369629, -0.00011881440877914429, -8.688867092132568e-05, -5.496293306350708e-05, -2.3037195205688477e-05, 8.888542652130127e-06, 4.081428050994873e-05, 7.274001836776733e-05, 0.00010466575622558594, 0.00013659149408340454, 0.00016851723194122314, 0.00020044296979904175, 0.00023236870765686035, 0.00026429444551467896, 0.00029622018337249756, 0.00032814592123031616, 0.00036007165908813477, 0.00039199739694595337, 0.00042392313480377197, 0.0004558488726615906, 0.0004877746105194092, 0.0005197003483772278, 0.0005516260862350464, 0.000583551824092865, 0.0006154775619506836, 0.0006474032998085022, 0.0006793290376663208, 0.0007112547755241394, 0.000743180513381958, 0.0007751062512397766, 0.0008070319890975952, 0.0008389577269554138, 0.0008708834648132324, 0.000902809202671051, 0.0009347349405288696, 0.0009666606783866882, 0.0009985864162445068, 0.0010305121541023254, 0.001062437891960144, 0.0010943636298179626, 0.0011262893676757812]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 4.0, 9.0, 6.0, 5.0, 11.0, 18.0, 12.0, 20.0, 18.0, 21.0, 30.0, 37.0, 46.0, 49.0, 74.0, 138.0, 193.0, 307.0, 541.0, 1457.0, 458938.0, 583438.0, 1568.0, 583.0, 318.0, 210.0, 106.0, 79.0, 57.0, 43.0, 41.0, 35.0, 19.0, 19.0, 17.0, 15.0, 15.0, 7.0, 11.0, 9.0, 9.0, 4.0, 5.0, 5.0, 0.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.024078369140625, -0.023370742797851562, -0.022663116455078125, -0.021955490112304688, -0.02124786376953125, -0.020540237426757812, -0.019832611083984375, -0.019124984741210938, -0.0184173583984375, -0.017709732055664062, -0.017002105712890625, -0.016294479370117188, -0.01558685302734375, -0.014879226684570312, -0.014171600341796875, -0.013463973999023438, -0.01275634765625, -0.012048721313476562, -0.011341094970703125, -0.010633468627929688, -0.00992584228515625, -0.009218215942382812, -0.008510589599609375, -0.0078029632568359375, -0.0070953369140625, -0.0063877105712890625, -0.005680084228515625, -0.0049724578857421875, -0.00426483154296875, -0.0035572052001953125, -0.002849578857421875, -0.0021419525146484375, -0.001434326171875, -0.0007266998291015625, -1.9073486328125e-05, 0.0006885528564453125, 0.00139617919921875, 0.0021038055419921875, 0.002811431884765625, 0.0035190582275390625, 0.0042266845703125, 0.0049343109130859375, 0.005641937255859375, 0.0063495635986328125, 0.00705718994140625, 0.0077648162841796875, 0.008472442626953125, 0.009180068969726562, 0.0098876953125, 0.010595321655273438, 0.011302947998046875, 0.012010574340820312, 0.01271820068359375, 0.013425827026367188, 0.014133453369140625, 0.014841079711914062, 0.0155487060546875, 0.016256332397460938, 0.016963958740234375, 0.017671585083007812, 0.01837921142578125, 0.019086837768554688, 0.019794464111328125, 0.020502090454101562, 0.021209716796875]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 12.0, 24.0, 71.0, 202.0, 292.0, 246.0, 108.0, 42.0, 13.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0004909675917588174, -0.0004270319768693298, -0.0003630963619798422, -0.00029916074709035456, -0.00023522513220086694, -0.0001712895173113793, -0.00010735390242189169, -4.3418287532404065e-05, 2.051732735708356e-05, 8.445294224657118e-05, 0.0001483885571360588, 0.00021232417202554643, 0.00027625978691503406, 0.0003401954018045217, 0.0004041310166940093, 0.00046806663158349693, 0.0005320022464729846, 0.0005959378322586417, 0.0006598734762519598, 0.0007238091202452779, 0.000787744706030935, 0.0008516802918165922, 0.0009156159358099103, 0.0009795515798032284, 0.0010434871073812246, 0.0011074227513745427, 0.0011713583953678608, 0.001235293922945857, 0.0012992295669391751, 0.0013631652109324932, 0.0014271007385104895, 0.0014910363825038075, 0.0015549720264971256, 0.0016189076704904437, 0.0016828433144837618, 0.001746778842061758, 0.0018107144860550761, 0.0018746501300483942, 0.0019385856576263905, 0.0020025214180350304, 0.0020664569456130266, 0.002130392473191023, 0.0021943282335996628, 0.002258263761177659, 0.0023221992887556553, 0.002386135049164295, 0.0024500705767422915, 0.0025140063371509314, 0.0025779418647289276, 0.002641877392306924, 0.0027058131527155638, 0.00276974868029356, 0.0028336844407022, 0.002897619968280196, 0.0029615554958581924, 0.0030254912562668324, 0.0030894267838448286, 0.003153362311422825, 0.0032172980718314648, 0.003281233599409461, 0.0033451691269874573, 0.003409104887396097, 0.0034730404149740934, 0.0035369761753827333, 0.0036009117029607296]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 11.0, 8.0, 11.0, 4.0, 17.0, 20.0, 20.0, 21.0, 25.0, 27.0, 28.0, 27.0, 28.0, 24.0, 38.0, 31.0, 43.0, 43.0, 42.0, 46.0, 53.0, 44.0, 47.0, 36.0, 29.0, 46.0, 23.0, 30.0, 28.0, 25.0, 22.0, 15.0, 16.0, 19.0, 12.0, 7.0, 11.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006652474403381348, -0.0006439900025725365, -0.0006227325648069382, -0.0006014751270413399, -0.0005802176892757416, -0.0005589602515101433, -0.000537702813744545, -0.0005164453759789467, -0.0004951879382133484, -0.0004739305004477501, -0.0004526730626821518, -0.0004314156249165535, -0.0004101581871509552, -0.0003889007493853569, -0.0003676433116197586, -0.0003463858738541603, -0.000325128436088562, -0.0003038709983229637, -0.0002826135605573654, -0.0002613561227917671, -0.00024009868502616882, -0.00021884124726057053, -0.00019758380949497223, -0.00017632637172937393, -0.00015506893396377563, -0.00013381149619817734, -0.00011255405843257904, -9.129662066698074e-05, -7.003918290138245e-05, -4.878174513578415e-05, -2.7524307370185852e-05, -6.266869604587555e-06, 1.4990568161010742e-05, 3.624800592660904e-05, 5.7505443692207336e-05, 7.876288145780563e-05, 0.00010002031922340393, 0.00012127775698900223, 0.00014253519475460052, 0.00016379263252019882, 0.00018505007028579712, 0.00020630750805139542, 0.0002275649458169937, 0.000248822383582592, 0.0002700798213481903, 0.0002913372591137886, 0.0003125946968793869, 0.0003338521346449852, 0.0003551095724105835, 0.0003763670101761818, 0.0003976244479417801, 0.0004188818857073784, 0.0004401393234729767, 0.000461396761238575, 0.0004826541990041733, 0.0005039116367697716, 0.0005251690745353699, 0.0005464265123009682, 0.0005676839500665665, 0.0005889413878321648, 0.0006101988255977631, 0.0006314562633633614, 0.0006527137011289597, 0.000673971138894558, 0.0006952285766601562]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 6.0, 4.0, 5.0, 5.0, 6.0, 11.0, 7.0, 10.0, 10.0, 12.0, 23.0, 19.0, 22.0, 30.0, 28.0, 42.0, 30.0, 37.0, 37.0, 46.0, 28.0, 47.0, 37.0, 41.0, 36.0, 39.0, 27.0, 33.0, 41.0, 34.0, 28.0, 19.0, 26.0, 28.0, 23.0, 20.0, 13.0, 18.0, 5.0, 7.0, 15.0, 14.0, 5.0, 8.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.9140625, -4.76416015625, -4.6142578125, -4.46435546875, -4.314453125, -4.16455078125, -4.0146484375, -3.86474609375, -3.71484375, -3.56494140625, -3.4150390625, -3.26513671875, -3.115234375, -2.96533203125, -2.8154296875, -2.66552734375, -2.515625, -2.36572265625, -2.2158203125, -2.06591796875, -1.916015625, -1.76611328125, -1.6162109375, -1.46630859375, -1.31640625, -1.16650390625, -1.0166015625, -0.86669921875, -0.716796875, -0.56689453125, -0.4169921875, -0.26708984375, -0.1171875, 0.03271484375, 0.1826171875, 0.33251953125, 0.482421875, 0.63232421875, 0.7822265625, 0.93212890625, 1.08203125, 1.23193359375, 1.3818359375, 1.53173828125, 1.681640625, 1.83154296875, 1.9814453125, 2.13134765625, 2.28125, 2.43115234375, 2.5810546875, 2.73095703125, 2.880859375, 3.03076171875, 3.1806640625, 3.33056640625, 3.48046875, 3.63037109375, 3.7802734375, 3.93017578125, 4.080078125, 4.22998046875, 4.3798828125, 4.52978515625, 4.6796875]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 2.0, 3.0, 9.0, 4.0, 10.0, 13.0, 13.0, 24.0, 31.0, 40.0, 72.0, 94.0, 124.0, 248.0, 352.0, 577.0, 1070.0, 2025.0, 3723.0, 7369.0, 15831.0, 38214.0, 102648.0, 322113.0, 360489.0, 116794.0, 41929.0, 17609.0, 8005.0, 4038.0, 2130.0, 1151.0, 670.0, 380.0, 269.0, 152.0, 90.0, 76.0, 47.0, 28.0, 24.0, 13.0, 17.0, 11.0, 9.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.0, -3.878997802734375, -3.75799560546875, -3.636993408203125, -3.5159912109375, -3.394989013671875, -3.27398681640625, -3.152984619140625, -3.031982421875, -2.910980224609375, -2.78997802734375, -2.668975830078125, -2.5479736328125, -2.426971435546875, -2.30596923828125, -2.184967041015625, -2.06396484375, -1.942962646484375, -1.82196044921875, -1.700958251953125, -1.5799560546875, -1.458953857421875, -1.33795166015625, -1.216949462890625, -1.095947265625, -0.974945068359375, -0.85394287109375, -0.732940673828125, -0.6119384765625, -0.490936279296875, -0.36993408203125, -0.248931884765625, -0.1279296875, -0.006927490234375, 0.11407470703125, 0.235076904296875, 0.3560791015625, 0.477081298828125, 0.59808349609375, 0.719085693359375, 0.840087890625, 0.961090087890625, 1.08209228515625, 1.203094482421875, 1.3240966796875, 1.445098876953125, 1.56610107421875, 1.687103271484375, 1.80810546875, 1.929107666015625, 2.05010986328125, 2.171112060546875, 2.2921142578125, 2.413116455078125, 2.53411865234375, 2.655120849609375, 2.776123046875, 2.897125244140625, 3.01812744140625, 3.139129638671875, 3.2601318359375, 3.381134033203125, 3.50213623046875, 3.623138427734375, 3.744140625]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 3.0, 2.0, 9.0, 5.0, 7.0, 13.0, 17.0, 18.0, 21.0, 29.0, 27.0, 39.0, 31.0, 37.0, 43.0, 56.0, 61.0, 113.0, 1644.0, 354.0, 97.0, 65.0, 56.0, 63.0, 37.0, 34.0, 37.0, 36.0, 14.0, 16.0, 21.0, 13.0, 14.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.515625, -23.79150390625, -23.0673828125, -22.34326171875, -21.619140625, -20.89501953125, -20.1708984375, -19.44677734375, -18.72265625, -17.99853515625, -17.2744140625, -16.55029296875, -15.826171875, -15.10205078125, -14.3779296875, -13.65380859375, -12.9296875, -12.20556640625, -11.4814453125, -10.75732421875, -10.033203125, -9.30908203125, -8.5849609375, -7.86083984375, -7.13671875, -6.41259765625, -5.6884765625, -4.96435546875, -4.240234375, -3.51611328125, -2.7919921875, -2.06787109375, -1.34375, -0.61962890625, 0.1044921875, 0.82861328125, 1.552734375, 2.27685546875, 3.0009765625, 3.72509765625, 4.44921875, 5.17333984375, 5.8974609375, 6.62158203125, 7.345703125, 8.06982421875, 8.7939453125, 9.51806640625, 10.2421875, 10.96630859375, 11.6904296875, 12.41455078125, 13.138671875, 13.86279296875, 14.5869140625, 15.31103515625, 16.03515625, 16.75927734375, 17.4833984375, 18.20751953125, 18.931640625, 19.65576171875, 20.3798828125, 21.10400390625, 21.828125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 4.0, 11.0, 15.0, 17.0, 37.0, 23.0, 33.0, 44.0, 72.0, 84.0, 144.0, 229.0, 344.0, 706.0, 5401.0, 3085552.0, 50520.0, 1198.0, 399.0, 289.0, 164.0, 98.0, 54.0, 59.0, 49.0, 44.0, 30.0, 20.0, 18.0, 10.0, 5.0, 7.0, 10.0, 0.0, 5.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.28125, -41.82421875, -40.3671875, -38.91015625, -37.453125, -35.99609375, -34.5390625, -33.08203125, -31.625, -30.16796875, -28.7109375, -27.25390625, -25.796875, -24.33984375, -22.8828125, -21.42578125, -19.96875, -18.51171875, -17.0546875, -15.59765625, -14.140625, -12.68359375, -11.2265625, -9.76953125, -8.3125, -6.85546875, -5.3984375, -3.94140625, -2.484375, -1.02734375, 0.4296875, 1.88671875, 3.34375, 4.80078125, 6.2578125, 7.71484375, 9.171875, 10.62890625, 12.0859375, 13.54296875, 15.0, 16.45703125, 17.9140625, 19.37109375, 20.828125, 22.28515625, 23.7421875, 25.19921875, 26.65625, 28.11328125, 29.5703125, 31.02734375, 32.484375, 33.94140625, 35.3984375, 36.85546875, 38.3125, 39.76953125, 41.2265625, 42.68359375, 44.140625, 45.59765625, 47.0546875, 48.51171875, 49.96875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 204.0, 687.0, 118.0, 5.0], "bins": [-220.53131103515625, -216.93911743164062, -213.34690856933594, -209.7547149658203, -206.16250610351562, -202.5703125, -198.9781036376953, -195.3859100341797, -191.793701171875, -188.20150756835938, -184.6092987060547, -181.01710510253906, -177.42489624023438, -173.83270263671875, -170.24049377441406, -166.64830017089844, -163.0561065673828, -159.4639129638672, -155.8717041015625, -152.27951049804688, -148.6873016357422, -145.09510803222656, -141.50289916992188, -137.91070556640625, -134.31849670410156, -130.72630310058594, -127.13409423828125, -123.5418930053711, -119.94969177246094, -116.35749816894531, -112.76528930664062, -109.173095703125, -105.58089447021484, -101.98869323730469, -98.39649200439453, -94.80429077148438, -91.21208953857422, -87.61988830566406, -84.02769470214844, -80.43549346923828, -76.84329223632812, -73.25109100341797, -69.65888977050781, -66.06668853759766, -62.474491119384766, -58.88228988647461, -55.29008865356445, -51.69789123535156, -48.10568618774414, -44.513484954833984, -40.92128372192383, -37.32908630371094, -33.73688507080078, -30.144683837890625, -26.55248260498047, -22.960283279418945, -19.36808204650879, -15.77588176727295, -12.18368148803711, -8.591480255126953, -4.999279975891113, -1.4070796966552734, 2.185121536254883, 5.777320861816406, 9.369522094726562]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 7.0, 3.0, 6.0, 12.0, 9.0, 12.0, 11.0, 18.0, 19.0, 29.0, 23.0, 27.0, 25.0, 32.0, 35.0, 39.0, 43.0, 61.0, 37.0, 39.0, 30.0, 51.0, 43.0, 43.0, 29.0, 41.0, 37.0, 29.0, 22.0, 30.0, 25.0, 25.0, 22.0, 18.0, 20.0, 11.0, 14.0, 4.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-51.35515213012695, -49.874122619628906, -48.393096923828125, -46.91206741333008, -45.4310417175293, -43.95001220703125, -42.46898651123047, -40.98795700073242, -39.50693130493164, -38.025901794433594, -36.54487609863281, -35.063846588134766, -33.582820892333984, -32.10179138183594, -30.620765686035156, -29.13973617553711, -27.658708572387695, -26.17768096923828, -24.696653366088867, -23.215625762939453, -21.73459815979004, -20.253570556640625, -18.772541046142578, -17.291515350341797, -15.810486793518066, -14.329459190368652, -12.848431587219238, -11.367403030395508, -9.886375427246094, -8.40534782409668, -6.924320220947266, -5.443292617797852, -3.9622650146484375, -2.4812374114990234, -1.0002095699310303, 0.4808182716369629, 1.961845874786377, 3.442873477935791, 4.923901557922363, 6.404929161071777, 7.885956764221191, 9.366984367370605, 10.84801197052002, 12.32904052734375, 13.810068130493164, 15.291095733642578, 16.772123336791992, 18.253150939941406, 19.73417854309082, 21.215206146240234, 22.69623374938965, 24.177261352539062, 25.658288955688477, 27.13931655883789, 28.620346069335938, 30.10137176513672, 31.582401275634766, 33.06343078613281, 34.544456481933594, 36.02548599243164, 37.50651168823242, 38.98754119873047, 40.46856689453125, 41.9495964050293, 43.43062210083008]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 6.0, 2.0, 5.0, 6.0, 7.0, 4.0, 9.0, 4.0, 3.0, 11.0, 11.0, 17.0, 20.0, 12.0, 16.0, 21.0, 33.0, 35.0, 37.0, 46.0, 27.0, 36.0, 41.0, 37.0, 49.0, 40.0, 39.0, 31.0, 26.0, 34.0, 41.0, 38.0, 22.0, 25.0, 33.0, 20.0, 34.0, 19.0, 17.0, 14.0, 11.0, 13.0, 11.0, 12.0, 8.0, 7.0, 6.0, 3.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.02734375, -4.872314453125, -4.71728515625, -4.562255859375, -4.4072265625, -4.252197265625, -4.09716796875, -3.942138671875, -3.787109375, -3.632080078125, -3.47705078125, -3.322021484375, -3.1669921875, -3.011962890625, -2.85693359375, -2.701904296875, -2.546875, -2.391845703125, -2.23681640625, -2.081787109375, -1.9267578125, -1.771728515625, -1.61669921875, -1.461669921875, -1.306640625, -1.151611328125, -0.99658203125, -0.841552734375, -0.6865234375, -0.531494140625, -0.37646484375, -0.221435546875, -0.06640625, 0.088623046875, 0.24365234375, 0.398681640625, 0.5537109375, 0.708740234375, 0.86376953125, 1.018798828125, 1.173828125, 1.328857421875, 1.48388671875, 1.638916015625, 1.7939453125, 1.948974609375, 2.10400390625, 2.259033203125, 2.4140625, 2.569091796875, 2.72412109375, 2.879150390625, 3.0341796875, 3.189208984375, 3.34423828125, 3.499267578125, 3.654296875, 3.809326171875, 3.96435546875, 4.119384765625, 4.2744140625, 4.429443359375, 4.58447265625, 4.739501953125, 4.89453125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 4.0, 5.0, 6.0, 6.0, 9.0, 7.0, 16.0, 16.0, 15.0, 21.0, 23.0, 19.0, 43.0, 59.0, 63.0, 110.0, 142.0, 257.0, 795.0, 7528.0, 492279.0, 3607952.0, 80905.0, 2757.0, 484.0, 219.0, 130.0, 87.0, 57.0, 41.0, 40.0, 35.0, 26.0, 20.0, 12.0, 7.0, 16.0, 11.0, 9.0, 11.0, 13.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-27.828125, -27.017333984375, -26.20654296875, -25.395751953125, -24.5849609375, -23.774169921875, -22.96337890625, -22.152587890625, -21.341796875, -20.531005859375, -19.72021484375, -18.909423828125, -18.0986328125, -17.287841796875, -16.47705078125, -15.666259765625, -14.85546875, -14.044677734375, -13.23388671875, -12.423095703125, -11.6123046875, -10.801513671875, -9.99072265625, -9.179931640625, -8.369140625, -7.558349609375, -6.74755859375, -5.936767578125, -5.1259765625, -4.315185546875, -3.50439453125, -2.693603515625, -1.8828125, -1.072021484375, -0.26123046875, 0.549560546875, 1.3603515625, 2.171142578125, 2.98193359375, 3.792724609375, 4.603515625, 5.414306640625, 6.22509765625, 7.035888671875, 7.8466796875, 8.657470703125, 9.46826171875, 10.279052734375, 11.08984375, 11.900634765625, 12.71142578125, 13.522216796875, 14.3330078125, 15.143798828125, 15.95458984375, 16.765380859375, 17.576171875, 18.386962890625, 19.19775390625, 20.008544921875, 20.8193359375, 21.630126953125, 22.44091796875, 23.251708984375, 24.0625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 7.0, 5.0, 17.0, 24.0, 23.0, 40.0, 61.0, 82.0, 114.0, 188.0, 243.0, 331.0, 434.0, 518.0, 507.0, 412.0, 324.0, 229.0, 167.0, 111.0, 78.0, 56.0, 37.0, 30.0, 11.0, 8.0, 4.0, 4.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.734375, -16.2930908203125, -15.851806640625, -15.4105224609375, -14.96923828125, -14.5279541015625, -14.086669921875, -13.6453857421875, -13.2041015625, -12.7628173828125, -12.321533203125, -11.8802490234375, -11.43896484375, -10.9976806640625, -10.556396484375, -10.1151123046875, -9.673828125, -9.2325439453125, -8.791259765625, -8.3499755859375, -7.90869140625, -7.4674072265625, -7.026123046875, -6.5848388671875, -6.1435546875, -5.7022705078125, -5.260986328125, -4.8197021484375, -4.37841796875, -3.9371337890625, -3.495849609375, -3.0545654296875, -2.61328125, -2.1719970703125, -1.730712890625, -1.2894287109375, -0.84814453125, -0.4068603515625, 0.034423828125, 0.4757080078125, 0.9169921875, 1.3582763671875, 1.799560546875, 2.2408447265625, 2.68212890625, 3.1234130859375, 3.564697265625, 4.0059814453125, 4.447265625, 4.8885498046875, 5.329833984375, 5.7711181640625, 6.21240234375, 6.6536865234375, 7.094970703125, 7.5362548828125, 7.9775390625, 8.4188232421875, 8.860107421875, 9.3013916015625, 9.74267578125, 10.1839599609375, 10.625244140625, 11.0665283203125, 11.5078125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 15.0, 20.0, 21.0, 23.0, 51.0, 62.0, 99.0, 143.0, 220.0, 321.0, 650.0, 2994.0, 174343.0, 3971528.0, 40686.0, 1696.0, 526.0, 290.0, 175.0, 124.0, 86.0, 71.0, 52.0, 31.0, 15.0, 11.0, 9.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.71875, -52.10888671875, -50.4990234375, -48.88916015625, -47.279296875, -45.66943359375, -44.0595703125, -42.44970703125, -40.83984375, -39.22998046875, -37.6201171875, -36.01025390625, -34.400390625, -32.79052734375, -31.1806640625, -29.57080078125, -27.9609375, -26.35107421875, -24.7412109375, -23.13134765625, -21.521484375, -19.91162109375, -18.3017578125, -16.69189453125, -15.08203125, -13.47216796875, -11.8623046875, -10.25244140625, -8.642578125, -7.03271484375, -5.4228515625, -3.81298828125, -2.203125, -0.59326171875, 1.0166015625, 2.62646484375, 4.236328125, 5.84619140625, 7.4560546875, 9.06591796875, 10.67578125, 12.28564453125, 13.8955078125, 15.50537109375, 17.115234375, 18.72509765625, 20.3349609375, 21.94482421875, 23.5546875, 25.16455078125, 26.7744140625, 28.38427734375, 29.994140625, 31.60400390625, 33.2138671875, 34.82373046875, 36.43359375, 38.04345703125, 39.6533203125, 41.26318359375, 42.873046875, 44.48291015625, 46.0927734375, 47.70263671875, 49.3125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 11.0, 21.0, 52.0, 89.0, 137.0, 177.0, 180.0, 160.0, 97.0, 56.0, 28.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.70643615722656, -142.91151428222656, -140.1165771484375, -137.3216552734375, -134.5267333984375, -131.7318115234375, -128.9368896484375, -126.14195251464844, -123.34703063964844, -120.55210876464844, -117.7571792602539, -114.96224975585938, -112.16732788085938, -109.37240600585938, -106.57747650146484, -103.78254699707031, -100.98762512207031, -98.19270324707031, -95.39777374267578, -92.60284423828125, -89.80792236328125, -87.01300048828125, -84.21807098388672, -81.42314147949219, -78.62821960449219, -75.83329772949219, -73.03836822509766, -70.24343872070312, -67.44851684570312, -64.65359497070312, -61.858665466308594, -59.06373977661133, -56.26881408691406, -53.4738883972168, -50.67896270751953, -47.884037017822266, -45.089111328125, -42.294185638427734, -39.49925994873047, -36.7043342590332, -33.90940856933594, -31.114482879638672, -28.319557189941406, -25.52463150024414, -22.729705810546875, -19.93478012084961, -17.139854431152344, -14.344928741455078, -11.550003051757812, -8.755077362060547, -5.960151672363281, -3.1652259826660156, -0.37030029296875, 2.4246253967285156, 5.219551086425781, 8.014476776123047, 10.809402465820312, 13.604328155517578, 16.399253845214844, 19.19417953491211, 21.989105224609375, 24.78403091430664, 27.578956604003906, 30.373882293701172, 33.16880798339844]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 7.0, 11.0, 5.0, 9.0, 15.0, 10.0, 22.0, 19.0, 27.0, 31.0, 38.0, 43.0, 44.0, 50.0, 48.0, 36.0, 57.0, 55.0, 49.0, 59.0, 31.0, 33.0, 45.0, 43.0, 31.0, 33.0, 27.0, 21.0, 13.0, 14.0, 19.0, 13.0, 10.0, 11.0, 10.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.098079681396484, -41.73369216918945, -40.36930847167969, -39.004920959472656, -37.640533447265625, -36.27614974975586, -34.91176223754883, -33.54737854003906, -32.18299102783203, -30.818605422973633, -29.454219818115234, -28.089832305908203, -26.725446701049805, -25.361061096191406, -23.996673583984375, -22.632287979125977, -21.267902374267578, -19.90351676940918, -18.53913116455078, -17.17474365234375, -15.810358047485352, -14.445972442626953, -13.081585884094238, -11.717199325561523, -10.352813720703125, -8.988428115844727, -7.624041557312012, -6.259655475616455, -4.895269393920898, -3.530883312225342, -2.166497230529785, -0.8021106719970703, 0.5622711181640625, 1.9266571998596191, 3.291043281555176, 4.655429363250732, 6.019815444946289, 7.384201526641846, 8.748587608337402, 10.112974166870117, 11.477359771728516, 12.841745376586914, 14.206131935119629, 15.570518493652344, 16.934904098510742, 18.29928970336914, 19.663677215576172, 21.02806282043457, 22.39244842529297, 23.756834030151367, 25.121219635009766, 26.485607147216797, 27.849992752075195, 29.214378356933594, 30.578765869140625, 31.943151473999023, 33.30753707885742, 34.67192459106445, 36.03630828857422, 37.40069580078125, 38.76508331298828, 40.12946701049805, 41.49385452270508, 42.858238220214844, 44.222625732421875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 8.0, 7.0, 3.0, 4.0, 9.0, 7.0, 5.0, 14.0, 13.0, 12.0, 18.0, 14.0, 16.0, 18.0, 18.0, 27.0, 33.0, 37.0, 38.0, 35.0, 55.0, 42.0, 41.0, 42.0, 35.0, 30.0, 23.0, 36.0, 37.0, 35.0, 27.0, 37.0, 27.0, 23.0, 25.0, 22.0, 26.0, 15.0, 20.0, 9.0, 11.0, 9.0, 9.0, 8.0, 13.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.109375, -4.9544677734375, -4.799560546875, -4.6446533203125, -4.48974609375, -4.3348388671875, -4.179931640625, -4.0250244140625, -3.8701171875, -3.7152099609375, -3.560302734375, -3.4053955078125, -3.25048828125, -3.0955810546875, -2.940673828125, -2.7857666015625, -2.630859375, -2.4759521484375, -2.321044921875, -2.1661376953125, -2.01123046875, -1.8563232421875, -1.701416015625, -1.5465087890625, -1.3916015625, -1.2366943359375, -1.081787109375, -0.9268798828125, -0.77197265625, -0.6170654296875, -0.462158203125, -0.3072509765625, -0.15234375, 0.0025634765625, 0.157470703125, 0.3123779296875, 0.46728515625, 0.6221923828125, 0.777099609375, 0.9320068359375, 1.0869140625, 1.2418212890625, 1.396728515625, 1.5516357421875, 1.70654296875, 1.8614501953125, 2.016357421875, 2.1712646484375, 2.326171875, 2.4810791015625, 2.635986328125, 2.7908935546875, 2.94580078125, 3.1007080078125, 3.255615234375, 3.4105224609375, 3.5654296875, 3.7203369140625, 3.875244140625, 4.0301513671875, 4.18505859375, 4.3399658203125, 4.494873046875, 4.6497802734375, 4.8046875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 12.0, 12.0, 13.0, 27.0, 35.0, 73.0, 104.0, 132.0, 222.0, 328.0, 512.0, 828.0, 1263.0, 2121.0, 3242.0, 5288.0, 8715.0, 14082.0, 23875.0, 41033.0, 72641.0, 133654.0, 226305.0, 219903.0, 127097.0, 69079.0, 39441.0, 22759.0, 13732.0, 8159.0, 5225.0, 3152.0, 1886.0, 1268.0, 836.0, 529.0, 362.0, 209.0, 123.0, 93.0, 66.0, 43.0, 20.0, 20.0, 18.0, 8.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-0.81005859375, -0.7868881225585938, -0.7637176513671875, -0.7405471801757812, -0.717376708984375, -0.6942062377929688, -0.6710357666015625, -0.6478652954101562, -0.62469482421875, -0.6015243530273438, -0.5783538818359375, -0.5551834106445312, -0.532012939453125, -0.5088424682617188, -0.4856719970703125, -0.46250152587890625, -0.4393310546875, -0.41616058349609375, -0.3929901123046875, -0.36981964111328125, -0.346649169921875, -0.32347869873046875, -0.3003082275390625, -0.27713775634765625, -0.25396728515625, -0.23079681396484375, -0.2076263427734375, -0.18445587158203125, -0.161285400390625, -0.13811492919921875, -0.1149444580078125, -0.09177398681640625, -0.068603515625, -0.04543304443359375, -0.0222625732421875, 0.00090789794921875, 0.024078369140625, 0.04724884033203125, 0.0704193115234375, 0.09358978271484375, 0.11676025390625, 0.13993072509765625, 0.1631011962890625, 0.18627166748046875, 0.209442138671875, 0.23261260986328125, 0.2557830810546875, 0.27895355224609375, 0.3021240234375, 0.32529449462890625, 0.3484649658203125, 0.37163543701171875, 0.394805908203125, 0.41797637939453125, 0.4411468505859375, 0.46431732177734375, 0.48748779296875, 0.5106582641601562, 0.5338287353515625, 0.5569992065429688, 0.580169677734375, 0.6033401489257812, 0.6265106201171875, 0.6496810913085938, 0.6728515625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 5.0, 5.0, 7.0, 14.0, 14.0, 12.0, 17.0, 23.0, 15.0, 25.0, 24.0, 26.0, 23.0, 26.0, 31.0, 47.0, 44.0, 45.0, 55.0, 30.0, 1068.0, 42.0, 29.0, 41.0, 39.0, 49.0, 33.0, 41.0, 28.0, 30.0, 15.0, 16.0, 18.0, 18.0, 20.0, 15.0, 8.0, 7.0, 4.0, 1.0, 2.0, 5.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.18359375, -3.07025146484375, -2.9569091796875, -2.84356689453125, -2.730224609375, -2.61688232421875, -2.5035400390625, -2.39019775390625, -2.27685546875, -2.16351318359375, -2.0501708984375, -1.93682861328125, -1.823486328125, -1.71014404296875, -1.5968017578125, -1.48345947265625, -1.3701171875, -1.25677490234375, -1.1434326171875, -1.03009033203125, -0.916748046875, -0.80340576171875, -0.6900634765625, -0.57672119140625, -0.46337890625, -0.35003662109375, -0.2366943359375, -0.12335205078125, -0.010009765625, 0.10333251953125, 0.2166748046875, 0.33001708984375, 0.443359375, 0.55670166015625, 0.6700439453125, 0.78338623046875, 0.896728515625, 1.01007080078125, 1.1234130859375, 1.23675537109375, 1.35009765625, 1.46343994140625, 1.5767822265625, 1.69012451171875, 1.803466796875, 1.91680908203125, 2.0301513671875, 2.14349365234375, 2.2568359375, 2.37017822265625, 2.4835205078125, 2.59686279296875, 2.710205078125, 2.82354736328125, 2.9368896484375, 3.05023193359375, 3.16357421875, 3.27691650390625, 3.3902587890625, 3.50360107421875, 3.616943359375, 3.73028564453125, 3.8436279296875, 3.95697021484375, 4.0703125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 6.0, 4.0, 7.0, 16.0, 20.0, 32.0, 50.0, 67.0, 112.0, 149.0, 240.0, 399.0, 625.0, 989.0, 1569.0, 2678.0, 4287.0, 7095.0, 11967.0, 20432.0, 35851.0, 65271.0, 120192.0, 205093.0, 1279142.0, 150696.0, 82607.0, 45203.0, 25421.0, 14717.0, 8529.0, 5182.0, 3260.0, 1931.0, 1153.0, 789.0, 495.0, 308.0, 185.0, 120.0, 98.0, 51.0, 26.0, 23.0, 19.0, 9.0, 6.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.64892578125, -0.6287689208984375, -0.608612060546875, -0.5884552001953125, -0.56829833984375, -0.5481414794921875, -0.527984619140625, -0.5078277587890625, -0.4876708984375, -0.4675140380859375, -0.447357177734375, -0.4272003173828125, -0.40704345703125, -0.3868865966796875, -0.366729736328125, -0.3465728759765625, -0.326416015625, -0.3062591552734375, -0.286102294921875, -0.2659454345703125, -0.24578857421875, -0.2256317138671875, -0.205474853515625, -0.1853179931640625, -0.1651611328125, -0.1450042724609375, -0.124847412109375, -0.1046905517578125, -0.08453369140625, -0.0643768310546875, -0.044219970703125, -0.0240631103515625, -0.00390625, 0.0162506103515625, 0.036407470703125, 0.0565643310546875, 0.07672119140625, 0.0968780517578125, 0.117034912109375, 0.1371917724609375, 0.1573486328125, 0.1775054931640625, 0.197662353515625, 0.2178192138671875, 0.23797607421875, 0.2581329345703125, 0.278289794921875, 0.2984466552734375, 0.318603515625, 0.3387603759765625, 0.358917236328125, 0.3790740966796875, 0.39923095703125, 0.4193878173828125, 0.439544677734375, 0.4597015380859375, 0.4798583984375, 0.5000152587890625, 0.520172119140625, 0.5403289794921875, 0.56048583984375, 0.5806427001953125, 0.600799560546875, 0.6209564208984375, 0.64111328125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 4.0, 3.0, 7.0, 6.0, 9.0, 10.0, 11.0, 16.0, 29.0, 33.0, 25.0, 33.0, 35.0, 51.0, 61.0, 67.0, 65.0, 62.0, 85.0, 66.0, 47.0, 47.0, 46.0, 34.0, 38.0, 33.0, 15.0, 9.0, 9.0, 10.0, 6.0, 9.0, 2.0, 5.0, 4.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0023174285888671875, -0.0022553354501724243, -0.002193242311477661, -0.002131149172782898, -0.0020690560340881348, -0.0020069628953933716, -0.0019448697566986084, -0.0018827766180038452, -0.001820683479309082, -0.0017585903406143188, -0.0016964972019195557, -0.0016344040632247925, -0.0015723109245300293, -0.0015102177858352661, -0.001448124647140503, -0.0013860315084457397, -0.0013239383697509766, -0.0012618452310562134, -0.0011997520923614502, -0.001137658953666687, -0.0010755658149719238, -0.0010134726762771606, -0.0009513795375823975, -0.0008892863988876343, -0.0008271932601928711, -0.0007651001214981079, -0.0007030069828033447, -0.0006409138441085815, -0.0005788207054138184, -0.0005167275667190552, -0.000454634428024292, -0.0003925412893295288, -0.0003304481506347656, -0.00026835501194000244, -0.00020626187324523926, -0.00014416873455047607, -8.207559585571289e-05, -1.9982457160949707e-05, 4.2110681533813477e-05, 0.00010420382022857666, 0.00016629695892333984, 0.00022839009761810303, 0.0002904832363128662, 0.0003525763750076294, 0.0004146695137023926, 0.00047676265239715576, 0.0005388557910919189, 0.0006009489297866821, 0.0006630420684814453, 0.0007251352071762085, 0.0007872283458709717, 0.0008493214845657349, 0.000911414623260498, 0.0009735077619552612, 0.0010356009006500244, 0.0010976940393447876, 0.0011597871780395508, 0.001221880316734314, 0.0012839734554290771, 0.0013460665941238403, 0.0014081597328186035, 0.0014702528715133667, 0.0015323460102081299, 0.001594439148902893, 0.0016565322875976562]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 10.0, 4.0, 3.0, 4.0, 10.0, 10.0, 17.0, 26.0, 37.0, 43.0, 64.0, 77.0, 132.0, 231.0, 505.0, 1513.0, 947699.0, 96183.0, 1007.0, 390.0, 185.0, 125.0, 66.0, 60.0, 35.0, 25.0, 21.0, 14.0, 18.0, 10.0, 6.0, 6.0, 7.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03753662109375, -0.036188602447509766, -0.03484058380126953, -0.0334925651550293, -0.03214454650878906, -0.030796527862548828, -0.029448509216308594, -0.02810049057006836, -0.026752471923828125, -0.02540445327758789, -0.024056434631347656, -0.022708415985107422, -0.021360397338867188, -0.020012378692626953, -0.01866436004638672, -0.017316341400146484, -0.01596832275390625, -0.014620304107666016, -0.013272285461425781, -0.011924266815185547, -0.010576248168945312, -0.009228229522705078, -0.007880210876464844, -0.006532192230224609, -0.005184173583984375, -0.0038361549377441406, -0.0024881362915039062, -0.0011401176452636719, 0.0002079010009765625, 0.0015559196472167969, 0.0029039382934570312, 0.004251956939697266, 0.0055999755859375, 0.006947994232177734, 0.008296012878417969, 0.009644031524658203, 0.010992050170898438, 0.012340068817138672, 0.013688087463378906, 0.01503610610961914, 0.016384124755859375, 0.01773214340209961, 0.019080162048339844, 0.020428180694580078, 0.021776199340820312, 0.023124217987060547, 0.02447223663330078, 0.025820255279541016, 0.02716827392578125, 0.028516292572021484, 0.02986431121826172, 0.031212329864501953, 0.03256034851074219, 0.03390836715698242, 0.035256385803222656, 0.03660440444946289, 0.037952423095703125, 0.03930044174194336, 0.040648460388183594, 0.04199647903442383, 0.04334449768066406, 0.0446925163269043, 0.04604053497314453, 0.047388553619384766, 0.048736572265625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 17.0, 115.0, 408.0, 365.0, 96.0, 13.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003042767057195306, -0.002920755185186863, -0.0027987430803477764, -0.0026767312083393335, -0.002554719103500247, -0.002432707231491804, -0.0023106951266527176, -0.0021886832546442747, -0.002066671382635832, -0.0019446593942120671, -0.0018226474057883024, -0.0017006355337798595, -0.001578623428940773, -0.0014566115569323301, -0.0013345995685085654, -0.0012125875800848007, -0.0010905754752457142, -0.0009685634868219495, -0.0008465514983981848, -0.000724539568182081, -0.0006025275797583163, -0.00048051559133455157, -0.0003585036611184478, -0.00023649167269468307, -0.00011447968427091837, 7.532289600931108e-06, 0.00012954426347278059, 0.00025155622279271483, 0.00037356821121647954, 0.0004955801996402442, 0.000617592129856348, 0.0007396041182801127, 0.0008616163395345211, 0.0009836283279582858, 0.0011056403163820505, 0.0012276521883904934, 0.00134966429322958, 0.0014716761652380228, 0.0015936881536617875, 0.0017157001420855522, 0.001837712130509317, 0.0019597241189330816, 0.0020817359909415245, 0.002203748095780611, 0.002325759967789054, 0.0024477720726281404, 0.0025697839446365833, 0.00269179604947567, 0.0028138079214841127, 0.0029358197934925556, 0.003057831898331642, 0.003179843770340085, 0.0033018558751791716, 0.0034238677471876144, 0.003545879852026701, 0.003667891724035144, 0.0037899035960435867, 0.003911915700882673, 0.0040339273400604725, 0.004155939444899559, 0.0042779515497386456, 0.004399963654577732, 0.004521975293755531, 0.004643987398594618, 0.004765999503433704]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 2.0, 9.0, 7.0, 5.0, 8.0, 5.0, 19.0, 22.0, 22.0, 28.0, 24.0, 23.0, 25.0, 32.0, 38.0, 39.0, 35.0, 52.0, 41.0, 46.0, 54.0, 45.0, 28.0, 36.0, 39.0, 37.0, 24.0, 30.0, 29.0, 32.0, 28.0, 32.0, 20.0, 15.0, 12.0, 15.0, 17.0, 10.0, 6.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0010434389114379883, -0.001012466847896576, -0.0009814947843551636, -0.0009505227208137512, -0.0009195506572723389, -0.0008885785937309265, -0.0008576065301895142, -0.0008266344666481018, -0.0007956624031066895, -0.0007646903395652771, -0.0007337182760238647, -0.0007027462124824524, -0.00067177414894104, -0.0006408020853996277, -0.0006098300218582153, -0.000578857958316803, -0.0005478858947753906, -0.0005169138312339783, -0.0004859417676925659, -0.00045496970415115356, -0.0004239976406097412, -0.00039302557706832886, -0.0003620535135269165, -0.00033108144998550415, -0.0003001093864440918, -0.00026913732290267944, -0.0002381652593612671, -0.00020719319581985474, -0.00017622113227844238, -0.00014524906873703003, -0.00011427700519561768, -8.330494165420532e-05, -5.233287811279297e-05, -2.1360814571380615e-05, 9.611248970031738e-06, 4.058331251144409e-05, 7.155537605285645e-05, 0.0001025274395942688, 0.00013349950313568115, 0.0001644715666770935, 0.00019544363021850586, 0.0002264156937599182, 0.00025738775730133057, 0.0002883598208427429, 0.0003193318843841553, 0.0003503039479255676, 0.00038127601146698, 0.00041224807500839233, 0.0004432201385498047, 0.00047419220209121704, 0.0005051642656326294, 0.0005361363291740417, 0.0005671083927154541, 0.0005980804562568665, 0.0006290525197982788, 0.0006600245833396912, 0.0006909966468811035, 0.0007219687104225159, 0.0007529407739639282, 0.0007839128375053406, 0.0008148849010467529, 0.0008458569645881653, 0.0008768290281295776, 0.00090780109167099, 0.0009387731552124023]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 8.0, 7.0, 3.0, 4.0, 9.0, 7.0, 5.0, 14.0, 13.0, 12.0, 18.0, 14.0, 16.0, 18.0, 18.0, 27.0, 33.0, 37.0, 38.0, 35.0, 55.0, 42.0, 41.0, 42.0, 35.0, 30.0, 23.0, 36.0, 37.0, 35.0, 26.0, 38.0, 27.0, 23.0, 25.0, 22.0, 26.0, 15.0, 20.0, 9.0, 11.0, 9.0, 9.0, 8.0, 13.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.109375, -4.9544677734375, -4.799560546875, -4.6446533203125, -4.48974609375, -4.3348388671875, -4.179931640625, -4.0250244140625, -3.8701171875, -3.7152099609375, -3.560302734375, -3.4053955078125, -3.25048828125, -3.0955810546875, -2.940673828125, -2.7857666015625, -2.630859375, -2.4759521484375, -2.321044921875, -2.1661376953125, -2.01123046875, -1.8563232421875, -1.701416015625, -1.5465087890625, -1.3916015625, -1.2366943359375, -1.081787109375, -0.9268798828125, -0.77197265625, -0.6170654296875, -0.462158203125, -0.3072509765625, -0.15234375, 0.0025634765625, 0.157470703125, 0.3123779296875, 0.46728515625, 0.6221923828125, 0.777099609375, 0.9320068359375, 1.0869140625, 1.2418212890625, 1.396728515625, 1.5516357421875, 1.70654296875, 1.8614501953125, 2.016357421875, 2.1712646484375, 2.326171875, 2.4810791015625, 2.635986328125, 2.7908935546875, 2.94580078125, 3.1007080078125, 3.255615234375, 3.4105224609375, 3.5654296875, 3.7203369140625, 3.875244140625, 4.0301513671875, 4.18505859375, 4.3399658203125, 4.494873046875, 4.6497802734375, 4.8046875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 6.0, 8.0, 11.0, 19.0, 30.0, 42.0, 88.0, 123.0, 219.0, 335.0, 540.0, 1005.0, 1923.0, 3496.0, 6691.0, 13306.0, 28099.0, 68282.0, 208749.0, 447634.0, 163281.0, 56359.0, 23871.0, 11522.0, 5896.0, 3140.0, 1673.0, 972.0, 510.0, 286.0, 170.0, 108.0, 69.0, 31.0, 25.0, 5.0, 9.0, 8.0, 4.0, 2.0, 11.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.171875, -4.046966552734375, -3.92205810546875, -3.797149658203125, -3.6722412109375, -3.547332763671875, -3.42242431640625, -3.297515869140625, -3.172607421875, -3.047698974609375, -2.92279052734375, -2.797882080078125, -2.6729736328125, -2.548065185546875, -2.42315673828125, -2.298248291015625, -2.17333984375, -2.048431396484375, -1.92352294921875, -1.798614501953125, -1.6737060546875, -1.548797607421875, -1.42388916015625, -1.298980712890625, -1.174072265625, -1.049163818359375, -0.92425537109375, -0.799346923828125, -0.6744384765625, -0.549530029296875, -0.42462158203125, -0.299713134765625, -0.1748046875, -0.049896240234375, 0.07501220703125, 0.199920654296875, 0.3248291015625, 0.449737548828125, 0.57464599609375, 0.699554443359375, 0.824462890625, 0.949371337890625, 1.07427978515625, 1.199188232421875, 1.3240966796875, 1.449005126953125, 1.57391357421875, 1.698822021484375, 1.82373046875, 1.948638916015625, 2.07354736328125, 2.198455810546875, 2.3233642578125, 2.448272705078125, 2.57318115234375, 2.698089599609375, 2.822998046875, 2.947906494140625, 3.07281494140625, 3.197723388671875, 3.3226318359375, 3.447540283203125, 3.57244873046875, 3.697357177734375, 3.822265625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 6.0, 7.0, 8.0, 7.0, 10.0, 11.0, 16.0, 17.0, 22.0, 18.0, 22.0, 28.0, 40.0, 35.0, 34.0, 50.0, 53.0, 81.0, 108.0, 1455.0, 415.0, 126.0, 59.0, 49.0, 59.0, 46.0, 45.0, 29.0, 35.0, 23.0, 22.0, 20.0, 9.0, 17.0, 14.0, 12.0, 13.0, 6.0, 7.0, 9.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-23.359375, -22.691650390625, -22.02392578125, -21.356201171875, -20.6884765625, -20.020751953125, -19.35302734375, -18.685302734375, -18.017578125, -17.349853515625, -16.68212890625, -16.014404296875, -15.3466796875, -14.678955078125, -14.01123046875, -13.343505859375, -12.67578125, -12.008056640625, -11.34033203125, -10.672607421875, -10.0048828125, -9.337158203125, -8.66943359375, -8.001708984375, -7.333984375, -6.666259765625, -5.99853515625, -5.330810546875, -4.6630859375, -3.995361328125, -3.32763671875, -2.659912109375, -1.9921875, -1.324462890625, -0.65673828125, 0.010986328125, 0.6787109375, 1.346435546875, 2.01416015625, 2.681884765625, 3.349609375, 4.017333984375, 4.68505859375, 5.352783203125, 6.0205078125, 6.688232421875, 7.35595703125, 8.023681640625, 8.69140625, 9.359130859375, 10.02685546875, 10.694580078125, 11.3623046875, 12.030029296875, 12.69775390625, 13.365478515625, 14.033203125, 14.700927734375, 15.36865234375, 16.036376953125, 16.7041015625, 17.371826171875, 18.03955078125, 18.707275390625, 19.375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 7.0, 9.0, 21.0, 52.0, 61.0, 80.0, 133.0, 252.0, 564.0, 3901.0, 3126460.0, 12714.0, 768.0, 273.0, 137.0, 96.0, 57.0, 41.0, 26.0, 18.0, 4.0, 4.0, 5.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-93.75, -90.7861328125, -87.822265625, -84.8583984375, -81.89453125, -78.9306640625, -75.966796875, -73.0029296875, -70.0390625, -67.0751953125, -64.111328125, -61.1474609375, -58.18359375, -55.2197265625, -52.255859375, -49.2919921875, -46.328125, -43.3642578125, -40.400390625, -37.4365234375, -34.47265625, -31.5087890625, -28.544921875, -25.5810546875, -22.6171875, -19.6533203125, -16.689453125, -13.7255859375, -10.76171875, -7.7978515625, -4.833984375, -1.8701171875, 1.09375, 4.0576171875, 7.021484375, 9.9853515625, 12.94921875, 15.9130859375, 18.876953125, 21.8408203125, 24.8046875, 27.7685546875, 30.732421875, 33.6962890625, 36.66015625, 39.6240234375, 42.587890625, 45.5517578125, 48.515625, 51.4794921875, 54.443359375, 57.4072265625, 60.37109375, 63.3349609375, 66.298828125, 69.2626953125, 72.2265625, 75.1904296875, 78.154296875, 81.1181640625, 84.08203125, 87.0458984375, 90.009765625, 92.9736328125, 95.9375]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 28.0, 820.0, 169.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.99887084960938, -62.86228942871094, -54.7257080078125, -46.58912658691406, -38.452545166015625, -30.315963745117188, -22.17938232421875, -14.042800903320312, -5.906219482421875, 2.2303619384765625, 10.366943359375, 18.503524780273438, 26.640106201171875, 34.77668762207031, 42.91326904296875, 51.04985046386719, 59.186431884765625, 67.32301330566406, 75.4595947265625, 83.59617614746094, 91.73275756835938, 99.86933898925781, 108.00592041015625, 116.14250183105469, 124.27908325195312, 132.41566467285156, 140.55224609375, 148.68882751464844, 156.82540893554688, 164.9619903564453, 173.09857177734375, 181.2351531982422, 189.37176513671875, 197.5083465576172, 205.64492797851562, 213.78150939941406, 221.9180908203125, 230.05467224121094, 238.19125366210938, 246.3278350830078, 254.46441650390625, 262.60101318359375, 270.7375793457031, 278.8741455078125, 287.0107421875, 295.1473388671875, 303.2839050292969, 311.42047119140625, 319.55706787109375, 327.69366455078125, 335.8302307128906, 343.966796875, 352.1033935546875, 360.239990234375, 368.3765563964844, 376.51312255859375, 384.64971923828125, 392.78631591796875, 400.9228820800781, 409.0594482421875, 417.196044921875, 425.3326416015625, 433.4692077636719, 441.60577392578125, 449.74237060546875]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 4.0, 1.0, 6.0, 9.0, 9.0, 15.0, 10.0, 21.0, 14.0, 17.0, 20.0, 24.0, 37.0, 28.0, 32.0, 40.0, 37.0, 36.0, 42.0, 40.0, 51.0, 58.0, 42.0, 42.0, 39.0, 35.0, 38.0, 27.0, 40.0, 36.0, 32.0, 25.0, 19.0, 19.0, 12.0, 13.0, 7.0, 6.0, 8.0, 5.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.05248260498047, -62.9578742980957, -60.86326217651367, -58.768653869628906, -56.674041748046875, -54.57943344116211, -52.484825134277344, -50.39021301269531, -48.29560470581055, -46.20099639892578, -44.10638427734375, -42.011775970458984, -39.91716766357422, -37.82255554199219, -35.72794723510742, -33.633338928222656, -31.538726806640625, -29.444116592407227, -27.349506378173828, -25.254898071289062, -23.160287857055664, -21.065677642822266, -18.9710693359375, -16.8764591217041, -14.781848907470703, -12.687238693237305, -10.592629432678223, -8.49802017211914, -6.403409957885742, -4.308799743652344, -2.2141904830932617, -0.11958122253417969, 1.9750213623046875, 4.069631099700928, 6.164240837097168, 8.25885009765625, 10.353460311889648, 12.448070526123047, 14.542679786682129, 16.63728904724121, 18.73189926147461, 20.826509475708008, 22.921119689941406, 25.015727996826172, 27.11033821105957, 29.20494842529297, 31.299556732177734, 33.3941650390625, 35.48877716064453, 37.5833854675293, 39.67799758911133, 41.772605895996094, 43.867218017578125, 45.96182632446289, 48.056434631347656, 50.15104675292969, 52.24565505981445, 54.34026336669922, 56.43487548828125, 58.529483795166016, 60.62409210205078, 62.71870422363281, 64.81331634521484, 66.90792083740234, 69.00253295898438]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 2.0, 5.0, 6.0, 9.0, 8.0, 6.0, 8.0, 6.0, 18.0, 13.0, 12.0, 17.0, 13.0, 16.0, 27.0, 25.0, 32.0, 27.0, 39.0, 42.0, 47.0, 43.0, 33.0, 41.0, 41.0, 39.0, 37.0, 33.0, 31.0, 33.0, 31.0, 33.0, 27.0, 27.0, 20.0, 20.0, 25.0, 19.0, 16.0, 17.0, 12.0, 13.0, 4.0, 9.0, 5.0, 8.0, 2.0, 4.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-5.78125, -5.6123046875, -5.443359375, -5.2744140625, -5.10546875, -4.9365234375, -4.767578125, -4.5986328125, -4.4296875, -4.2607421875, -4.091796875, -3.9228515625, -3.75390625, -3.5849609375, -3.416015625, -3.2470703125, -3.078125, -2.9091796875, -2.740234375, -2.5712890625, -2.40234375, -2.2333984375, -2.064453125, -1.8955078125, -1.7265625, -1.5576171875, -1.388671875, -1.2197265625, -1.05078125, -0.8818359375, -0.712890625, -0.5439453125, -0.375, -0.2060546875, -0.037109375, 0.1318359375, 0.30078125, 0.4697265625, 0.638671875, 0.8076171875, 0.9765625, 1.1455078125, 1.314453125, 1.4833984375, 1.65234375, 1.8212890625, 1.990234375, 2.1591796875, 2.328125, 2.4970703125, 2.666015625, 2.8349609375, 3.00390625, 3.1728515625, 3.341796875, 3.5107421875, 3.6796875, 3.8486328125, 4.017578125, 4.1865234375, 4.35546875, 4.5244140625, 4.693359375, 4.8623046875, 5.03125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 6.0, 2.0, 11.0, 8.0, 11.0, 23.0, 32.0, 37.0, 51.0, 63.0, 91.0, 112.0, 156.0, 283.0, 515.0, 933.0, 2210.0, 5890.0, 18421.0, 77799.0, 431616.0, 1502441.0, 1560271.0, 473748.0, 88567.0, 20320.0, 6099.0, 2264.0, 930.0, 479.0, 290.0, 160.0, 115.0, 87.0, 68.0, 45.0, 45.0, 27.0, 22.0, 17.0, 8.0, 4.0, 2.0, 4.0, 3.0, 2.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.5234375, -8.265380859375, -8.00732421875, -7.749267578125, -7.4912109375, -7.233154296875, -6.97509765625, -6.717041015625, -6.458984375, -6.200927734375, -5.94287109375, -5.684814453125, -5.4267578125, -5.168701171875, -4.91064453125, -4.652587890625, -4.39453125, -4.136474609375, -3.87841796875, -3.620361328125, -3.3623046875, -3.104248046875, -2.84619140625, -2.588134765625, -2.330078125, -2.072021484375, -1.81396484375, -1.555908203125, -1.2978515625, -1.039794921875, -0.78173828125, -0.523681640625, -0.265625, -0.007568359375, 0.25048828125, 0.508544921875, 0.7666015625, 1.024658203125, 1.28271484375, 1.540771484375, 1.798828125, 2.056884765625, 2.31494140625, 2.572998046875, 2.8310546875, 3.089111328125, 3.34716796875, 3.605224609375, 3.86328125, 4.121337890625, 4.37939453125, 4.637451171875, 4.8955078125, 5.153564453125, 5.41162109375, 5.669677734375, 5.927734375, 6.185791015625, 6.44384765625, 6.701904296875, 6.9599609375, 7.218017578125, 7.47607421875, 7.734130859375, 7.9921875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 5.0, 6.0, 3.0, 3.0, 14.0, 15.0, 29.0, 34.0, 43.0, 67.0, 76.0, 118.0, 153.0, 197.0, 304.0, 395.0, 447.0, 432.0, 410.0, 335.0, 273.0, 193.0, 160.0, 104.0, 69.0, 44.0, 46.0, 35.0, 17.0, 15.0, 16.0, 5.0, 2.0, 5.0, 1.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.734375, -11.334716796875, -10.93505859375, -10.535400390625, -10.1357421875, -9.736083984375, -9.33642578125, -8.936767578125, -8.537109375, -8.137451171875, -7.73779296875, -7.338134765625, -6.9384765625, -6.538818359375, -6.13916015625, -5.739501953125, -5.33984375, -4.940185546875, -4.54052734375, -4.140869140625, -3.7412109375, -3.341552734375, -2.94189453125, -2.542236328125, -2.142578125, -1.742919921875, -1.34326171875, -0.943603515625, -0.5439453125, -0.144287109375, 0.25537109375, 0.655029296875, 1.0546875, 1.454345703125, 1.85400390625, 2.253662109375, 2.6533203125, 3.052978515625, 3.45263671875, 3.852294921875, 4.251953125, 4.651611328125, 5.05126953125, 5.450927734375, 5.8505859375, 6.250244140625, 6.64990234375, 7.049560546875, 7.44921875, 7.848876953125, 8.24853515625, 8.648193359375, 9.0478515625, 9.447509765625, 9.84716796875, 10.246826171875, 10.646484375, 11.046142578125, 11.44580078125, 11.845458984375, 12.2451171875, 12.644775390625, 13.04443359375, 13.444091796875, 13.84375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 5.0, 3.0, 5.0, 8.0, 5.0, 16.0, 18.0, 16.0, 16.0, 40.0, 45.0, 53.0, 68.0, 83.0, 100.0, 167.0, 268.0, 399.0, 987.0, 6446.0, 246597.0, 3797319.0, 135106.0, 4457.0, 833.0, 383.0, 240.0, 151.0, 111.0, 76.0, 62.0, 50.0, 27.0, 22.0, 22.0, 20.0, 24.0, 11.0, 9.0, 5.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.390625, -30.246337890625, -29.10205078125, -27.957763671875, -26.8134765625, -25.669189453125, -24.52490234375, -23.380615234375, -22.236328125, -21.092041015625, -19.94775390625, -18.803466796875, -17.6591796875, -16.514892578125, -15.37060546875, -14.226318359375, -13.08203125, -11.937744140625, -10.79345703125, -9.649169921875, -8.5048828125, -7.360595703125, -6.21630859375, -5.072021484375, -3.927734375, -2.783447265625, -1.63916015625, -0.494873046875, 0.6494140625, 1.793701171875, 2.93798828125, 4.082275390625, 5.2265625, 6.370849609375, 7.51513671875, 8.659423828125, 9.8037109375, 10.947998046875, 12.09228515625, 13.236572265625, 14.380859375, 15.525146484375, 16.66943359375, 17.813720703125, 18.9580078125, 20.102294921875, 21.24658203125, 22.390869140625, 23.53515625, 24.679443359375, 25.82373046875, 26.968017578125, 28.1123046875, 29.256591796875, 30.40087890625, 31.545166015625, 32.689453125, 33.833740234375, 34.97802734375, 36.122314453125, 37.2666015625, 38.410888671875, 39.55517578125, 40.699462890625, 41.84375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 13.0, 18.0, 89.0, 136.0, 247.0, 222.0, 153.0, 93.0, 26.0, 10.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.01139831542969, -81.48544311523438, -77.9594955444336, -74.43354034423828, -70.90758514404297, -67.38163757324219, -63.855682373046875, -60.32973098754883, -56.80377960205078, -53.277828216552734, -49.75187301635742, -46.225921630859375, -42.69997024536133, -39.17401885986328, -35.64806365966797, -32.12211227416992, -28.59615707397461, -25.07020378112793, -21.544252395629883, -18.018299102783203, -14.49234676361084, -10.966394424438477, -7.440441131591797, -3.91448974609375, -0.3885364532470703, 3.137416124343872, 6.6633687019348145, 10.189321517944336, 13.7152738571167, 17.241226196289062, 20.767179489135742, 24.29313087463379, 27.81908416748047, 31.34503746032715, 34.87099075317383, 38.396942138671875, 41.92289352416992, 45.44884490966797, 48.97480010986328, 52.50075149536133, 56.026702880859375, 59.55265426635742, 63.078609466552734, 66.60456085205078, 70.1305160522461, 73.65646362304688, 77.18241882324219, 80.7083740234375, 84.23432922363281, 87.76028442382812, 91.2862319946289, 94.81218719482422, 98.33814239501953, 101.86408996582031, 105.39004516601562, 108.91600036621094, 112.44194793701172, 115.96790313720703, 119.49385070800781, 123.01980590820312, 126.54576110839844, 130.07171630859375, 133.59765625, 137.1236114501953, 140.64956665039062]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 5.0, 6.0, 7.0, 9.0, 13.0, 12.0, 16.0, 15.0, 23.0, 25.0, 19.0, 36.0, 35.0, 33.0, 42.0, 33.0, 46.0, 39.0, 50.0, 34.0, 47.0, 51.0, 45.0, 38.0, 37.0, 32.0, 42.0, 25.0, 25.0, 20.0, 24.0, 19.0, 19.0, 12.0, 16.0, 9.0, 9.0, 7.0, 3.0, 6.0, 8.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-40.776039123535156, -39.480377197265625, -38.18471908569336, -36.88905715942383, -35.59339904785156, -34.29773712158203, -33.0020751953125, -31.706417083740234, -30.410755157470703, -29.115095138549805, -27.819435119628906, -26.523773193359375, -25.228113174438477, -23.932453155517578, -22.63679313659668, -21.34113311767578, -20.045473098754883, -18.749813079833984, -17.454153060913086, -16.158493041992188, -14.862831115722656, -13.567171096801758, -12.27151107788086, -10.975850105285645, -9.680190086364746, -8.384530067443848, -7.088869094848633, -5.793209075927734, -4.497548580169678, -3.201888084411621, -1.9062280654907227, -0.6105670928955078, 0.6850929260253906, 1.9807533025741577, 3.276413679122925, 4.572073936462402, 5.867734432220459, 7.163394927978516, 8.459054946899414, 9.754715919494629, 11.050375938415527, 12.346035957336426, 13.64169692993164, 14.937356948852539, 16.233016967773438, 17.52867889404297, 18.824337005615234, 20.119998931884766, 21.415658950805664, 22.711318969726562, 24.00697898864746, 25.30263900756836, 26.59830093383789, 27.89396095275879, 29.189620971679688, 30.48528289794922, 31.780941009521484, 33.076602935791016, 34.37226104736328, 35.66792297363281, 36.96358108520508, 38.25924301147461, 39.554901123046875, 40.850563049316406, 42.14622497558594]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 7.0, 9.0, 9.0, 8.0, 14.0, 7.0, 16.0, 23.0, 13.0, 16.0, 26.0, 26.0, 29.0, 27.0, 38.0, 31.0, 36.0, 44.0, 42.0, 53.0, 36.0, 34.0, 58.0, 30.0, 33.0, 31.0, 32.0, 26.0, 22.0, 33.0, 24.0, 30.0, 20.0, 22.0, 18.0, 14.0, 12.0, 8.0, 12.0, 6.0, 6.0, 9.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.00390625, -5.825439453125, -5.64697265625, -5.468505859375, -5.2900390625, -5.111572265625, -4.93310546875, -4.754638671875, -4.576171875, -4.397705078125, -4.21923828125, -4.040771484375, -3.8623046875, -3.683837890625, -3.50537109375, -3.326904296875, -3.1484375, -2.969970703125, -2.79150390625, -2.613037109375, -2.4345703125, -2.256103515625, -2.07763671875, -1.899169921875, -1.720703125, -1.542236328125, -1.36376953125, -1.185302734375, -1.0068359375, -0.828369140625, -0.64990234375, -0.471435546875, -0.29296875, -0.114501953125, 0.06396484375, 0.242431640625, 0.4208984375, 0.599365234375, 0.77783203125, 0.956298828125, 1.134765625, 1.313232421875, 1.49169921875, 1.670166015625, 1.8486328125, 2.027099609375, 2.20556640625, 2.384033203125, 2.5625, 2.740966796875, 2.91943359375, 3.097900390625, 3.2763671875, 3.454833984375, 3.63330078125, 3.811767578125, 3.990234375, 4.168701171875, 4.34716796875, 4.525634765625, 4.7041015625, 4.882568359375, 5.06103515625, 5.239501953125, 5.41796875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 7.0, 2.0, 10.0, 11.0, 27.0, 35.0, 48.0, 48.0, 91.0, 127.0, 165.0, 259.0, 413.0, 577.0, 860.0, 1220.0, 1834.0, 2821.0, 4642.0, 7098.0, 11218.0, 18655.0, 30988.0, 53651.0, 97272.0, 174826.0, 239050.0, 173154.0, 95962.0, 53048.0, 30658.0, 18418.0, 11259.0, 6997.0, 4504.0, 3020.0, 1928.0, 1234.0, 799.0, 532.0, 355.0, 255.0, 151.0, 105.0, 74.0, 48.0, 36.0, 27.0, 21.0, 8.0, 9.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.77978515625, -0.756500244140625, -0.73321533203125, -0.709930419921875, -0.6866455078125, -0.663360595703125, -0.64007568359375, -0.616790771484375, -0.593505859375, -0.570220947265625, -0.54693603515625, -0.523651123046875, -0.5003662109375, -0.477081298828125, -0.45379638671875, -0.430511474609375, -0.4072265625, -0.383941650390625, -0.36065673828125, -0.337371826171875, -0.3140869140625, -0.290802001953125, -0.26751708984375, -0.244232177734375, -0.220947265625, -0.197662353515625, -0.17437744140625, -0.151092529296875, -0.1278076171875, -0.104522705078125, -0.08123779296875, -0.057952880859375, -0.03466796875, -0.011383056640625, 0.01190185546875, 0.035186767578125, 0.0584716796875, 0.081756591796875, 0.10504150390625, 0.128326416015625, 0.151611328125, 0.174896240234375, 0.19818115234375, 0.221466064453125, 0.2447509765625, 0.268035888671875, 0.29132080078125, 0.314605712890625, 0.337890625, 0.361175537109375, 0.38446044921875, 0.407745361328125, 0.4310302734375, 0.454315185546875, 0.47760009765625, 0.500885009765625, 0.524169921875, 0.547454833984375, 0.57073974609375, 0.594024658203125, 0.6173095703125, 0.640594482421875, 0.66387939453125, 0.687164306640625, 0.71044921875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 7.0, 5.0, 6.0, 9.0, 7.0, 15.0, 12.0, 17.0, 14.0, 11.0, 21.0, 27.0, 23.0, 27.0, 32.0, 30.0, 36.0, 40.0, 42.0, 50.0, 37.0, 32.0, 1067.0, 36.0, 46.0, 41.0, 45.0, 29.0, 41.0, 31.0, 25.0, 22.0, 17.0, 21.0, 16.0, 14.0, 17.0, 9.0, 14.0, 11.0, 6.0, 5.0, 6.0, 6.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.634765625, -3.517669677734375, -3.40057373046875, -3.283477783203125, -3.1663818359375, -3.049285888671875, -2.93218994140625, -2.815093994140625, -2.697998046875, -2.580902099609375, -2.46380615234375, -2.346710205078125, -2.2296142578125, -2.112518310546875, -1.99542236328125, -1.878326416015625, -1.76123046875, -1.644134521484375, -1.52703857421875, -1.409942626953125, -1.2928466796875, -1.175750732421875, -1.05865478515625, -0.941558837890625, -0.824462890625, -0.707366943359375, -0.59027099609375, -0.473175048828125, -0.3560791015625, -0.238983154296875, -0.12188720703125, -0.004791259765625, 0.1123046875, 0.229400634765625, 0.34649658203125, 0.463592529296875, 0.5806884765625, 0.697784423828125, 0.81488037109375, 0.931976318359375, 1.049072265625, 1.166168212890625, 1.28326416015625, 1.400360107421875, 1.5174560546875, 1.634552001953125, 1.75164794921875, 1.868743896484375, 1.98583984375, 2.102935791015625, 2.22003173828125, 2.337127685546875, 2.4542236328125, 2.571319580078125, 2.68841552734375, 2.805511474609375, 2.922607421875, 3.039703369140625, 3.15679931640625, 3.273895263671875, 3.3909912109375, 3.508087158203125, 3.62518310546875, 3.742279052734375, 3.859375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 7.0, 2.0, 7.0, 16.0, 20.0, 27.0, 41.0, 54.0, 102.0, 134.0, 244.0, 380.0, 564.0, 882.0, 1391.0, 2231.0, 3623.0, 5847.0, 9201.0, 15484.0, 26362.0, 45476.0, 83173.0, 152791.0, 1281297.0, 201615.0, 115659.0, 63174.0, 35026.0, 20337.0, 12203.0, 7509.0, 4621.0, 2790.0, 1740.0, 1097.0, 698.0, 463.0, 261.0, 190.0, 143.0, 92.0, 51.0, 33.0, 29.0, 14.0, 16.0, 10.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7197265625, -0.6977615356445312, -0.6757965087890625, -0.6538314819335938, -0.631866455078125, -0.6099014282226562, -0.5879364013671875, -0.5659713745117188, -0.54400634765625, -0.5220413208007812, -0.5000762939453125, -0.47811126708984375, -0.456146240234375, -0.43418121337890625, -0.4122161865234375, -0.39025115966796875, -0.3682861328125, -0.34632110595703125, -0.3243560791015625, -0.30239105224609375, -0.280426025390625, -0.25846099853515625, -0.2364959716796875, -0.21453094482421875, -0.19256591796875, -0.17060089111328125, -0.1486358642578125, -0.12667083740234375, -0.104705810546875, -0.08274078369140625, -0.0607757568359375, -0.03881072998046875, -0.016845703125, 0.00511932373046875, 0.0270843505859375, 0.04904937744140625, 0.071014404296875, 0.09297943115234375, 0.1149444580078125, 0.13690948486328125, 0.15887451171875, 0.18083953857421875, 0.2028045654296875, 0.22476959228515625, 0.246734619140625, 0.26869964599609375, 0.2906646728515625, 0.31262969970703125, 0.3345947265625, 0.35655975341796875, 0.3785247802734375, 0.40048980712890625, 0.422454833984375, 0.44441986083984375, 0.4663848876953125, 0.48834991455078125, 0.51031494140625, 0.5322799682617188, 0.5542449951171875, 0.5762100219726562, 0.598175048828125, 0.6201400756835938, 0.6421051025390625, 0.6640701293945312, 0.68603515625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 2.0, 5.0, 3.0, 7.0, 2.0, 3.0, 10.0, 16.0, 16.0, 25.0, 38.0, 54.0, 59.0, 55.0, 70.0, 61.0, 74.0, 87.0, 69.0, 60.0, 51.0, 42.0, 52.0, 26.0, 26.0, 23.0, 15.0, 12.0, 14.0, 10.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021419525146484375, -0.0020746588706970215, -0.0020073652267456055, -0.0019400715827941895, -0.0018727779388427734, -0.0018054842948913574, -0.0017381906509399414, -0.0016708970069885254, -0.0016036033630371094, -0.0015363097190856934, -0.0014690160751342773, -0.0014017224311828613, -0.0013344287872314453, -0.0012671351432800293, -0.0011998414993286133, -0.0011325478553771973, -0.0010652542114257812, -0.0009979605674743652, -0.0009306669235229492, -0.0008633732795715332, -0.0007960796356201172, -0.0007287859916687012, -0.0006614923477172852, -0.0005941987037658691, -0.0005269050598144531, -0.0004596114158630371, -0.0003923177719116211, -0.0003250241279602051, -0.00025773048400878906, -0.00019043684005737305, -0.00012314319610595703, -5.5849552154541016e-05, 1.1444091796875e-05, 7.873773574829102e-05, 0.00014603137969970703, 0.00021332502365112305, 0.00028061866760253906, 0.0003479123115539551, 0.0004152059555053711, 0.0004824995994567871, 0.0005497932434082031, 0.0006170868873596191, 0.0006843805313110352, 0.0007516741752624512, 0.0008189678192138672, 0.0008862614631652832, 0.0009535551071166992, 0.0010208487510681152, 0.0010881423950195312, 0.0011554360389709473, 0.0012227296829223633, 0.0012900233268737793, 0.0013573169708251953, 0.0014246106147766113, 0.0014919042587280273, 0.0015591979026794434, 0.0016264915466308594, 0.0016937851905822754, 0.0017610788345336914, 0.0018283724784851074, 0.0018956661224365234, 0.0019629597663879395, 0.0020302534103393555, 0.0020975470542907715, 0.0021648406982421875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 4.0, 8.0, 13.0, 17.0, 18.0, 36.0, 36.0, 52.0, 58.0, 118.0, 213.0, 400.0, 1465.0, 954519.0, 89849.0, 927.0, 347.0, 143.0, 105.0, 67.0, 59.0, 26.0, 16.0, 13.0, 6.0, 4.0, 6.0, 7.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.050079345703125, -0.04855489730834961, -0.04703044891357422, -0.04550600051879883, -0.04398155212402344, -0.04245710372924805, -0.040932655334472656, -0.039408206939697266, -0.037883758544921875, -0.036359310150146484, -0.034834861755371094, -0.0333104133605957, -0.03178596496582031, -0.030261516571044922, -0.02873706817626953, -0.02721261978149414, -0.02568817138671875, -0.02416372299194336, -0.02263927459716797, -0.021114826202392578, -0.019590377807617188, -0.018065929412841797, -0.016541481018066406, -0.015017032623291016, -0.013492584228515625, -0.011968135833740234, -0.010443687438964844, -0.008919239044189453, -0.0073947906494140625, -0.005870342254638672, -0.004345893859863281, -0.0028214454650878906, -0.0012969970703125, 0.00022745132446289062, 0.0017518997192382812, 0.003276348114013672, 0.0048007965087890625, 0.006325244903564453, 0.007849693298339844, 0.009374141693115234, 0.010898590087890625, 0.012423038482666016, 0.013947486877441406, 0.015471935272216797, 0.016996383666992188, 0.018520832061767578, 0.02004528045654297, 0.02156972885131836, 0.02309417724609375, 0.02461862564086914, 0.02614307403564453, 0.027667522430419922, 0.029191970825195312, 0.030716419219970703, 0.032240867614746094, 0.033765316009521484, 0.035289764404296875, 0.036814212799072266, 0.038338661193847656, 0.03986310958862305, 0.04138755798339844, 0.04291200637817383, 0.04443645477294922, 0.04596090316772461, 0.0474853515625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 55.0, 582.0, 364.0, 11.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012366867624223232, -0.012145215645432472, -0.011923563666641712, -0.011701912619173527, -0.011480260640382767, -0.011258608661592007, -0.011036956682801247, -0.010815305635333061, -0.010593653656542301, -0.010372001677751541, -0.010150349698960781, -0.009928698651492596, -0.009707046672701836, -0.009485394693911076, -0.009263742715120316, -0.00904209166765213, -0.008820438757538795, -0.008598786778748035, -0.008377134799957275, -0.00815548375248909, -0.00793383177369833, -0.00771217979490757, -0.00749052781611681, -0.007268876302987337, -0.007047224789857864, -0.006825572811067104, -0.006603921297937632, -0.006382269319146872, -0.006160617806017399, -0.005938965827226639, -0.005717313848435879, -0.005495662335306406, -0.005274011287838221, -0.0050523593090474606, -0.004830707795917988, -0.004609055817127228, -0.004387404303997755, -0.004165752325206995, -0.003944100812077522, -0.0037224488332867622, -0.003500797087326646, -0.0032791453413665295, -0.003057493595406413, -0.0028358418494462967, -0.0026141898706555367, -0.002392538357526064, -0.002170886378735304, -0.0019492346327751875, -0.001727582886815071, -0.0015059311408549547, -0.0012842793948948383, -0.0010626275325194001, -0.0008409757865592837, -0.0006193240405991673, -0.00039767217822372913, -0.00017602043226361275, 4.563131369650364e-05, 0.0002672830887604505, 0.0004889348638243973, 0.0007105866679921746, 0.000932238413952291, 0.0011538901599124074, 0.0013755420222878456, 0.001597193768247962, 0.0018188455142080784]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 8.0, 7.0, 8.0, 9.0, 8.0, 9.0, 20.0, 19.0, 23.0, 16.0, 34.0, 25.0, 27.0, 36.0, 40.0, 41.0, 43.0, 43.0, 38.0, 36.0, 46.0, 42.0, 46.0, 47.0, 35.0, 43.0, 34.0, 30.0, 29.0, 31.0, 22.0, 13.0, 20.0, 13.0, 13.0, 7.0, 9.0, 4.0, 7.0, 8.0, 5.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0009273290634155273, -0.0008969549089670181, -0.0008665807545185089, -0.0008362066000699997, -0.0008058324456214905, -0.0007754582911729813, -0.000745084136724472, -0.0007147099822759628, -0.0006843358278274536, -0.0006539616733789444, -0.0006235875189304352, -0.000593213364481926, -0.0005628392100334167, -0.0005324650555849075, -0.0005020909011363983, -0.0004717167466878891, -0.0004413425922393799, -0.00041096843779087067, -0.00038059428334236145, -0.00035022012889385223, -0.000319845974445343, -0.0002894718199968338, -0.0002590976655483246, -0.00022872351109981537, -0.00019834935665130615, -0.00016797520220279694, -0.00013760104775428772, -0.0001072268933057785, -7.685273885726929e-05, -4.647858440876007e-05, -1.6104429960250854e-05, 1.4269724488258362e-05, 4.464387893676758e-05, 7.50180333852768e-05, 0.00010539218783378601, 0.00013576634228229523, 0.00016614049673080444, 0.00019651465117931366, 0.00022688880562782288, 0.0002572629600763321, 0.0002876371145248413, 0.0003180112689733505, 0.00034838542342185974, 0.00037875957787036896, 0.0004091337323188782, 0.0004395078867673874, 0.0004698820412158966, 0.0005002561956644058, 0.000530630350112915, 0.0005610045045614243, 0.0005913786590099335, 0.0006217528134584427, 0.0006521269679069519, 0.0006825011223554611, 0.0007128752768039703, 0.0007432494312524796, 0.0007736235857009888, 0.000803997740149498, 0.0008343718945980072, 0.0008647460490465164, 0.0008951202034950256, 0.0009254943579435349, 0.0009558685123920441, 0.0009862426668405533, 0.0010166168212890625]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 7.0, 9.0, 9.0, 8.0, 14.0, 7.0, 16.0, 23.0, 13.0, 16.0, 26.0, 26.0, 29.0, 27.0, 38.0, 31.0, 36.0, 44.0, 42.0, 53.0, 36.0, 34.0, 58.0, 30.0, 33.0, 31.0, 32.0, 26.0, 22.0, 33.0, 24.0, 30.0, 20.0, 22.0, 18.0, 14.0, 12.0, 8.0, 12.0, 6.0, 6.0, 9.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.00390625, -5.825439453125, -5.64697265625, -5.468505859375, -5.2900390625, -5.111572265625, -4.93310546875, -4.754638671875, -4.576171875, -4.397705078125, -4.21923828125, -4.040771484375, -3.8623046875, -3.683837890625, -3.50537109375, -3.326904296875, -3.1484375, -2.969970703125, -2.79150390625, -2.613037109375, -2.4345703125, -2.256103515625, -2.07763671875, -1.899169921875, -1.720703125, -1.542236328125, -1.36376953125, -1.185302734375, -1.0068359375, -0.828369140625, -0.64990234375, -0.471435546875, -0.29296875, -0.114501953125, 0.06396484375, 0.242431640625, 0.4208984375, 0.599365234375, 0.77783203125, 0.956298828125, 1.134765625, 1.313232421875, 1.49169921875, 1.670166015625, 1.8486328125, 2.027099609375, 2.20556640625, 2.384033203125, 2.5625, 2.740966796875, 2.91943359375, 3.097900390625, 3.2763671875, 3.454833984375, 3.63330078125, 3.811767578125, 3.990234375, 4.168701171875, 4.34716796875, 4.525634765625, 4.7041015625, 4.882568359375, 5.06103515625, 5.239501953125, 5.41796875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 9.0, 19.0, 8.0, 28.0, 43.0, 87.0, 120.0, 185.0, 344.0, 590.0, 1334.0, 2881.0, 7618.0, 22143.0, 76238.0, 304756.0, 462140.0, 118240.0, 33483.0, 10881.0, 3916.0, 1684.0, 814.0, 413.0, 227.0, 146.0, 80.0, 45.0, 35.0, 23.0, 9.0, 7.0, 7.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3359375, -6.1505126953125, -5.965087890625, -5.7796630859375, -5.59423828125, -5.4088134765625, -5.223388671875, -5.0379638671875, -4.8525390625, -4.6671142578125, -4.481689453125, -4.2962646484375, -4.11083984375, -3.9254150390625, -3.739990234375, -3.5545654296875, -3.369140625, -3.1837158203125, -2.998291015625, -2.8128662109375, -2.62744140625, -2.4420166015625, -2.256591796875, -2.0711669921875, -1.8857421875, -1.7003173828125, -1.514892578125, -1.3294677734375, -1.14404296875, -0.9586181640625, -0.773193359375, -0.5877685546875, -0.40234375, -0.2169189453125, -0.031494140625, 0.1539306640625, 0.33935546875, 0.5247802734375, 0.710205078125, 0.8956298828125, 1.0810546875, 1.2664794921875, 1.451904296875, 1.6373291015625, 1.82275390625, 2.0081787109375, 2.193603515625, 2.3790283203125, 2.564453125, 2.7498779296875, 2.935302734375, 3.1207275390625, 3.30615234375, 3.4915771484375, 3.677001953125, 3.8624267578125, 4.0478515625, 4.2332763671875, 4.418701171875, 4.6041259765625, 4.78955078125, 4.9749755859375, 5.160400390625, 5.3458251953125, 5.53125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 1.0, 0.0, 4.0, 1.0, 1.0, 11.0, 13.0, 13.0, 17.0, 22.0, 33.0, 25.0, 37.0, 47.0, 45.0, 59.0, 92.0, 171.0, 1767.0, 222.0, 83.0, 66.0, 61.0, 50.0, 50.0, 30.0, 23.0, 25.0, 21.0, 11.0, 6.0, 6.0, 9.0, 11.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-35.9375, -34.92822265625, -33.9189453125, -32.90966796875, -31.900390625, -30.89111328125, -29.8818359375, -28.87255859375, -27.86328125, -26.85400390625, -25.8447265625, -24.83544921875, -23.826171875, -22.81689453125, -21.8076171875, -20.79833984375, -19.7890625, -18.77978515625, -17.7705078125, -16.76123046875, -15.751953125, -14.74267578125, -13.7333984375, -12.72412109375, -11.71484375, -10.70556640625, -9.6962890625, -8.68701171875, -7.677734375, -6.66845703125, -5.6591796875, -4.64990234375, -3.640625, -2.63134765625, -1.6220703125, -0.61279296875, 0.396484375, 1.40576171875, 2.4150390625, 3.42431640625, 4.43359375, 5.44287109375, 6.4521484375, 7.46142578125, 8.470703125, 9.47998046875, 10.4892578125, 11.49853515625, 12.5078125, 13.51708984375, 14.5263671875, 15.53564453125, 16.544921875, 17.55419921875, 18.5634765625, 19.57275390625, 20.58203125, 21.59130859375, 22.6005859375, 23.60986328125, 24.619140625, 25.62841796875, 26.6376953125, 27.64697265625, 28.65625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 3.0, 12.0, 6.0, 13.0, 10.0, 14.0, 36.0, 35.0, 53.0, 56.0, 98.0, 133.0, 150.0, 284.0, 522.0, 1698.0, 2626829.0, 513092.0, 1354.0, 472.0, 249.0, 176.0, 108.0, 81.0, 46.0, 54.0, 26.0, 24.0, 21.0, 11.0, 10.0, 5.0, 5.0, 3.0, 0.0, 4.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.0, -56.810546875, -54.62109375, -52.431640625, -50.2421875, -48.052734375, -45.86328125, -43.673828125, -41.484375, -39.294921875, -37.10546875, -34.916015625, -32.7265625, -30.537109375, -28.34765625, -26.158203125, -23.96875, -21.779296875, -19.58984375, -17.400390625, -15.2109375, -13.021484375, -10.83203125, -8.642578125, -6.453125, -4.263671875, -2.07421875, 0.115234375, 2.3046875, 4.494140625, 6.68359375, 8.873046875, 11.0625, 13.251953125, 15.44140625, 17.630859375, 19.8203125, 22.009765625, 24.19921875, 26.388671875, 28.578125, 30.767578125, 32.95703125, 35.146484375, 37.3359375, 39.525390625, 41.71484375, 43.904296875, 46.09375, 48.283203125, 50.47265625, 52.662109375, 54.8515625, 57.041015625, 59.23046875, 61.419921875, 63.609375, 65.798828125, 67.98828125, 70.177734375, 72.3671875, 74.556640625, 76.74609375, 78.935546875, 81.125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 19.0, 50.0, 151.0, 301.0, 292.0, 146.0, 39.0, 16.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.77010154724121, -15.090267181396484, -13.410432815551758, -11.730599403381348, -10.050765037536621, -8.370930671691895, -6.691097259521484, -5.011262893676758, -3.3314285278320312, -1.6515944004058838, 0.028239727020263672, 1.708073616027832, 3.3879079818725586, 5.067742347717285, 6.747575759887695, 8.427410125732422, 10.107244491577148, 11.787078857421875, 13.466913223266602, 15.146746635437012, 16.826580047607422, 18.50641632080078, 20.186248779296875, 21.8660831451416, 23.545917510986328, 25.225751876831055, 26.90558624267578, 28.585418701171875, 30.265254974365234, 31.945087432861328, 33.62492370605469, 35.30475616455078, 36.984588623046875, 38.66442108154297, 40.34425735473633, 42.02408981323242, 43.70392608642578, 45.383758544921875, 47.06359100341797, 48.74342727661133, 50.42326354980469, 52.10309600830078, 53.78293228149414, 55.462764739990234, 57.142601013183594, 58.82243347167969, 60.50226593017578, 62.18210220336914, 63.861934661865234, 65.5417709350586, 67.22160339355469, 68.90143585205078, 70.58126831054688, 72.2611083984375, 73.9409408569336, 75.62077331542969, 77.30060577392578, 78.98043823242188, 80.66027069091797, 82.3401107788086, 84.01994323730469, 85.69977569580078, 87.37960815429688, 89.0594482421875, 90.7392807006836]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 2.0, 6.0, 5.0, 6.0, 8.0, 11.0, 14.0, 11.0, 13.0, 12.0, 20.0, 25.0, 28.0, 33.0, 28.0, 35.0, 23.0, 39.0, 42.0, 39.0, 45.0, 37.0, 44.0, 37.0, 39.0, 34.0, 45.0, 25.0, 31.0, 32.0, 35.0, 31.0, 31.0, 16.0, 22.0, 12.0, 10.0, 11.0, 8.0, 14.0, 6.0, 11.0, 2.0, 5.0, 9.0, 7.0, 7.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-59.63533020019531, -57.91346740722656, -56.19160079956055, -54.4697380065918, -52.74787139892578, -51.02600860595703, -49.30414581298828, -47.58228302001953, -45.860416412353516, -44.138553619384766, -42.41668701171875, -40.69482421875, -38.97296142578125, -37.251094818115234, -35.529232025146484, -33.80736541748047, -32.08550262451172, -30.363637924194336, -28.641773223876953, -26.919910430908203, -25.19804573059082, -23.476181030273438, -21.754318237304688, -20.032453536987305, -18.310588836669922, -16.58872413635254, -14.866860389709473, -13.144996643066406, -11.423131942749023, -9.70126724243164, -7.979403495788574, -6.257539749145508, -4.535675048828125, -2.8138108253479004, -1.0919466018676758, 0.6299176216125488, 2.3517818450927734, 4.073646545410156, 5.795510292053223, 7.517374038696289, 9.239238739013672, 10.961103439331055, 12.682967185974121, 14.404830932617188, 16.12669563293457, 17.848560333251953, 19.570423126220703, 21.292287826538086, 23.01415252685547, 24.73601722717285, 26.457881927490234, 28.179744720458984, 29.901609420776367, 31.62347412109375, 33.3453369140625, 35.06719970703125, 36.789066314697266, 38.510929107666016, 40.23279571533203, 41.95465850830078, 43.67652130126953, 45.39838790893555, 47.1202507019043, 48.84211730957031, 50.56398010253906]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 4.0, 2.0, 5.0, 7.0, 7.0, 1.0, 11.0, 13.0, 9.0, 12.0, 15.0, 18.0, 20.0, 22.0, 15.0, 28.0, 29.0, 26.0, 26.0, 27.0, 38.0, 33.0, 36.0, 42.0, 45.0, 41.0, 42.0, 30.0, 39.0, 38.0, 26.0, 20.0, 36.0, 23.0, 23.0, 31.0, 18.0, 31.0, 19.0, 16.0, 14.0, 12.0, 6.0, 16.0, 5.0, 8.0, 7.0, 7.0, 8.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.51953125, -5.34332275390625, -5.1671142578125, -4.99090576171875, -4.814697265625, -4.63848876953125, -4.4622802734375, -4.28607177734375, -4.10986328125, -3.93365478515625, -3.7574462890625, -3.58123779296875, -3.405029296875, -3.22882080078125, -3.0526123046875, -2.87640380859375, -2.7001953125, -2.52398681640625, -2.3477783203125, -2.17156982421875, -1.995361328125, -1.81915283203125, -1.6429443359375, -1.46673583984375, -1.29052734375, -1.11431884765625, -0.9381103515625, -0.76190185546875, -0.585693359375, -0.40948486328125, -0.2332763671875, -0.05706787109375, 0.119140625, 0.29534912109375, 0.4715576171875, 0.64776611328125, 0.823974609375, 1.00018310546875, 1.1763916015625, 1.35260009765625, 1.52880859375, 1.70501708984375, 1.8812255859375, 2.05743408203125, 2.233642578125, 2.40985107421875, 2.5860595703125, 2.76226806640625, 2.9384765625, 3.11468505859375, 3.2908935546875, 3.46710205078125, 3.643310546875, 3.81951904296875, 3.9957275390625, 4.17193603515625, 4.34814453125, 4.52435302734375, 4.7005615234375, 4.87677001953125, 5.052978515625, 5.22918701171875, 5.4053955078125, 5.58160400390625, 5.7578125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 8.0, 6.0, 7.0, 1.0, 13.0, 15.0, 20.0, 10.0, 23.0, 26.0, 25.0, 25.0, 43.0, 45.0, 94.0, 160.0, 337.0, 1149.0, 9564.0, 568146.0, 3479794.0, 129125.0, 4192.0, 718.0, 239.0, 147.0, 64.0, 50.0, 25.0, 28.0, 25.0, 28.0, 20.0, 23.0, 17.0, 10.0, 11.0, 5.0, 10.0, 8.0, 4.0, 8.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.765625, -24.0, -23.234375, -22.46875, -21.703125, -20.9375, -20.171875, -19.40625, -18.640625, -17.875, -17.109375, -16.34375, -15.578125, -14.8125, -14.046875, -13.28125, -12.515625, -11.75, -10.984375, -10.21875, -9.453125, -8.6875, -7.921875, -7.15625, -6.390625, -5.625, -4.859375, -4.09375, -3.328125, -2.5625, -1.796875, -1.03125, -0.265625, 0.5, 1.265625, 2.03125, 2.796875, 3.5625, 4.328125, 5.09375, 5.859375, 6.625, 7.390625, 8.15625, 8.921875, 9.6875, 10.453125, 11.21875, 11.984375, 12.75, 13.515625, 14.28125, 15.046875, 15.8125, 16.578125, 17.34375, 18.109375, 18.875, 19.640625, 20.40625, 21.171875, 21.9375, 22.703125, 23.46875, 24.234375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 4.0, 4.0, 8.0, 11.0, 12.0, 19.0, 24.0, 38.0, 50.0, 86.0, 109.0, 158.0, 198.0, 320.0, 405.0, 483.0, 494.0, 429.0, 346.0, 256.0, 178.0, 136.0, 75.0, 80.0, 53.0, 24.0, 20.0, 20.0, 10.0, 9.0, 3.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0546875, -12.6348876953125, -12.215087890625, -11.7952880859375, -11.37548828125, -10.9556884765625, -10.535888671875, -10.1160888671875, -9.6962890625, -9.2764892578125, -8.856689453125, -8.4368896484375, -8.01708984375, -7.5972900390625, -7.177490234375, -6.7576904296875, -6.337890625, -5.9180908203125, -5.498291015625, -5.0784912109375, -4.65869140625, -4.2388916015625, -3.819091796875, -3.3992919921875, -2.9794921875, -2.5596923828125, -2.139892578125, -1.7200927734375, -1.30029296875, -0.8804931640625, -0.460693359375, -0.0408935546875, 0.37890625, 0.7987060546875, 1.218505859375, 1.6383056640625, 2.05810546875, 2.4779052734375, 2.897705078125, 3.3175048828125, 3.7373046875, 4.1571044921875, 4.576904296875, 4.9967041015625, 5.41650390625, 5.8363037109375, 6.256103515625, 6.6759033203125, 7.095703125, 7.5155029296875, 7.935302734375, 8.3551025390625, 8.77490234375, 9.1947021484375, 9.614501953125, 10.0343017578125, 10.4541015625, 10.8739013671875, 11.293701171875, 11.7135009765625, 12.13330078125, 12.5531005859375, 12.972900390625, 13.3927001953125, 13.8125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 3.0, 8.0, 14.0, 10.0, 16.0, 22.0, 36.0, 38.0, 63.0, 84.0, 123.0, 197.0, 318.0, 607.0, 2380.0, 125076.0, 4014798.0, 47505.0, 1659.0, 511.0, 253.0, 146.0, 106.0, 72.0, 70.0, 48.0, 27.0, 22.0, 20.0, 12.0, 9.0, 7.0, 7.0, 7.0, 3.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.96875, -50.41357421875, -48.8583984375, -47.30322265625, -45.748046875, -44.19287109375, -42.6376953125, -41.08251953125, -39.52734375, -37.97216796875, -36.4169921875, -34.86181640625, -33.306640625, -31.75146484375, -30.1962890625, -28.64111328125, -27.0859375, -25.53076171875, -23.9755859375, -22.42041015625, -20.865234375, -19.31005859375, -17.7548828125, -16.19970703125, -14.64453125, -13.08935546875, -11.5341796875, -9.97900390625, -8.423828125, -6.86865234375, -5.3134765625, -3.75830078125, -2.203125, -0.64794921875, 0.9072265625, 2.46240234375, 4.017578125, 5.57275390625, 7.1279296875, 8.68310546875, 10.23828125, 11.79345703125, 13.3486328125, 14.90380859375, 16.458984375, 18.01416015625, 19.5693359375, 21.12451171875, 22.6796875, 24.23486328125, 25.7900390625, 27.34521484375, 28.900390625, 30.45556640625, 32.0107421875, 33.56591796875, 35.12109375, 36.67626953125, 38.2314453125, 39.78662109375, 41.341796875, 42.89697265625, 44.4521484375, 46.00732421875, 47.5625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 26.0, 73.0, 136.0, 237.0, 244.0, 162.0, 88.0, 30.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.61029815673828, -80.12138366699219, -76.63246154785156, -73.14354705810547, -69.65463256835938, -66.16571044921875, -62.676795959472656, -59.18788146972656, -55.6989631652832, -52.210044860839844, -48.72113037109375, -45.23221206665039, -41.74329376220703, -38.25437927246094, -34.76546096801758, -31.27654457092285, -27.787628173828125, -24.2987117767334, -20.809795379638672, -17.320877075195312, -13.831960678100586, -10.34304428100586, -6.8541259765625, -3.3652095794677734, 0.12370681762695312, 3.612623691558838, 7.101540565490723, 10.590457916259766, 14.079374313354492, 17.56829071044922, 21.057209014892578, 24.546125411987305, 28.035049438476562, 31.52396583557129, 35.012882232666016, 38.501800537109375, 41.99071502685547, 45.47963333129883, 48.96855163574219, 52.45746612548828, 55.94638442993164, 59.435302734375, 62.924217224121094, 66.41313171386719, 69.90205383300781, 73.3909683227539, 76.8798828125, 80.36880493164062, 83.85771942138672, 87.34663391113281, 90.83555603027344, 94.32447052001953, 97.81338500976562, 101.30230712890625, 104.79122161865234, 108.28013610839844, 111.76905822753906, 115.25797271728516, 118.74689483642578, 122.23580932617188, 125.72472381591797, 129.21363830566406, 132.7025604248047, 136.1914825439453, 139.68038940429688]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 3.0, 6.0, 13.0, 13.0, 7.0, 17.0, 17.0, 17.0, 18.0, 19.0, 28.0, 27.0, 23.0, 23.0, 35.0, 29.0, 42.0, 43.0, 33.0, 45.0, 54.0, 40.0, 49.0, 43.0, 39.0, 33.0, 34.0, 35.0, 23.0, 29.0, 34.0, 9.0, 19.0, 18.0, 15.0, 13.0, 13.0, 7.0, 8.0, 7.0, 4.0, 5.0, 5.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-39.80173110961914, -38.61882781982422, -37.43592834472656, -36.253028869628906, -35.070125579833984, -33.88722229003906, -32.704322814941406, -31.521421432495117, -30.338520050048828, -29.15561866760254, -27.97271728515625, -26.78981590270996, -25.606914520263672, -24.424013137817383, -23.241111755371094, -22.058210372924805, -20.875308990478516, -19.692407608032227, -18.509506225585938, -17.32660484313965, -16.14370346069336, -14.96080207824707, -13.777900695800781, -12.594999313354492, -11.412097930908203, -10.229196548461914, -9.046295166015625, -7.863393783569336, -6.680492401123047, -5.497591018676758, -4.314689636230469, -3.1317882537841797, -1.948883056640625, -0.7659816741943359, 0.4169197082519531, 1.5998210906982422, 2.7827224731445312, 3.9656238555908203, 5.148525238037109, 6.331426620483398, 7.5143280029296875, 8.697229385375977, 9.880130767822266, 11.063032150268555, 12.245933532714844, 13.428834915161133, 14.611736297607422, 15.794637680053711, 16.9775390625, 18.16044044494629, 19.343341827392578, 20.526243209838867, 21.709144592285156, 22.892045974731445, 24.074947357177734, 25.257848739624023, 26.440750122070312, 27.6236515045166, 28.80655288696289, 29.98945426940918, 31.17235565185547, 32.355255126953125, 33.53815841674805, 34.72106170654297, 35.903961181640625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 2.0, 4.0, 4.0, 8.0, 8.0, 11.0, 10.0, 8.0, 17.0, 12.0, 12.0, 23.0, 35.0, 24.0, 19.0, 25.0, 33.0, 34.0, 35.0, 31.0, 26.0, 37.0, 40.0, 39.0, 35.0, 42.0, 46.0, 27.0, 34.0, 30.0, 25.0, 40.0, 25.0, 20.0, 24.0, 22.0, 20.0, 21.0, 16.0, 14.0, 12.0, 11.0, 7.0, 9.0, 4.0, 7.0, 3.0, 7.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2734375, -5.10284423828125, -4.9322509765625, -4.76165771484375, -4.591064453125, -4.42047119140625, -4.2498779296875, -4.07928466796875, -3.90869140625, -3.73809814453125, -3.5675048828125, -3.39691162109375, -3.226318359375, -3.05572509765625, -2.8851318359375, -2.71453857421875, -2.5439453125, -2.37335205078125, -2.2027587890625, -2.03216552734375, -1.861572265625, -1.69097900390625, -1.5203857421875, -1.34979248046875, -1.17919921875, -1.00860595703125, -0.8380126953125, -0.66741943359375, -0.496826171875, -0.32623291015625, -0.1556396484375, 0.01495361328125, 0.185546875, 0.35614013671875, 0.5267333984375, 0.69732666015625, 0.867919921875, 1.03851318359375, 1.2091064453125, 1.37969970703125, 1.55029296875, 1.72088623046875, 1.8914794921875, 2.06207275390625, 2.232666015625, 2.40325927734375, 2.5738525390625, 2.74444580078125, 2.9150390625, 3.08563232421875, 3.2562255859375, 3.42681884765625, 3.597412109375, 3.76800537109375, 3.9385986328125, 4.10919189453125, 4.27978515625, 4.45037841796875, 4.6209716796875, 4.79156494140625, 4.962158203125, 5.13275146484375, 5.3033447265625, 5.47393798828125, 5.64453125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 5.0, 9.0, 8.0, 13.0, 18.0, 23.0, 41.0, 57.0, 76.0, 110.0, 138.0, 232.0, 343.0, 468.0, 754.0, 1061.0, 1686.0, 2421.0, 3651.0, 5661.0, 8785.0, 13932.0, 22398.0, 36881.0, 62591.0, 108846.0, 177231.0, 212939.0, 155857.0, 92157.0, 54187.0, 31900.0, 19504.0, 12102.0, 7734.0, 4873.0, 3285.0, 2167.0, 1354.0, 956.0, 647.0, 480.0, 291.0, 213.0, 151.0, 107.0, 75.0, 42.0, 35.0, 22.0, 22.0, 10.0, 6.0, 4.0, 5.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.69091796875, -0.6695632934570312, -0.6482086181640625, -0.6268539428710938, -0.605499267578125, -0.5841445922851562, -0.5627899169921875, -0.5414352416992188, -0.52008056640625, -0.49872589111328125, -0.4773712158203125, -0.45601654052734375, -0.434661865234375, -0.41330718994140625, -0.3919525146484375, -0.37059783935546875, -0.3492431640625, -0.32788848876953125, -0.3065338134765625, -0.28517913818359375, -0.263824462890625, -0.24246978759765625, -0.2211151123046875, -0.19976043701171875, -0.17840576171875, -0.15705108642578125, -0.1356964111328125, -0.11434173583984375, -0.092987060546875, -0.07163238525390625, -0.0502777099609375, -0.02892303466796875, -0.007568359375, 0.01378631591796875, 0.0351409912109375, 0.05649566650390625, 0.077850341796875, 0.09920501708984375, 0.1205596923828125, 0.14191436767578125, 0.16326904296875, 0.18462371826171875, 0.2059783935546875, 0.22733306884765625, 0.248687744140625, 0.27004241943359375, 0.2913970947265625, 0.31275177001953125, 0.3341064453125, 0.35546112060546875, 0.3768157958984375, 0.39817047119140625, 0.419525146484375, 0.44087982177734375, 0.4622344970703125, 0.48358917236328125, 0.50494384765625, 0.5262985229492188, 0.5476531982421875, 0.5690078735351562, 0.590362548828125, 0.6117172241210938, 0.6330718994140625, 0.6544265747070312, 0.67578125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 8.0, 5.0, 5.0, 6.0, 8.0, 10.0, 17.0, 13.0, 13.0, 26.0, 19.0, 24.0, 34.0, 30.0, 32.0, 49.0, 43.0, 46.0, 31.0, 54.0, 34.0, 1064.0, 29.0, 37.0, 29.0, 35.0, 38.0, 32.0, 39.0, 29.0, 23.0, 25.0, 14.0, 18.0, 20.0, 15.0, 17.0, 10.0, 10.0, 4.0, 7.0, 8.0, 5.0, 2.0, 1.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.708984375, -3.588043212890625, -3.46710205078125, -3.346160888671875, -3.2252197265625, -3.104278564453125, -2.98333740234375, -2.862396240234375, -2.741455078125, -2.620513916015625, -2.49957275390625, -2.378631591796875, -2.2576904296875, -2.136749267578125, -2.01580810546875, -1.894866943359375, -1.77392578125, -1.652984619140625, -1.53204345703125, -1.411102294921875, -1.2901611328125, -1.169219970703125, -1.04827880859375, -0.927337646484375, -0.806396484375, -0.685455322265625, -0.56451416015625, -0.443572998046875, -0.3226318359375, -0.201690673828125, -0.08074951171875, 0.040191650390625, 0.1611328125, 0.282073974609375, 0.40301513671875, 0.523956298828125, 0.6448974609375, 0.765838623046875, 0.88677978515625, 1.007720947265625, 1.128662109375, 1.249603271484375, 1.37054443359375, 1.491485595703125, 1.6124267578125, 1.733367919921875, 1.85430908203125, 1.975250244140625, 2.09619140625, 2.217132568359375, 2.33807373046875, 2.459014892578125, 2.5799560546875, 2.700897216796875, 2.82183837890625, 2.942779541015625, 3.063720703125, 3.184661865234375, 3.30560302734375, 3.426544189453125, 3.5474853515625, 3.668426513671875, 3.78936767578125, 3.910308837890625, 4.03125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 1.0, 6.0, 6.0, 15.0, 20.0, 27.0, 43.0, 62.0, 114.0, 137.0, 220.0, 374.0, 619.0, 923.0, 1429.0, 2259.0, 3683.0, 6027.0, 9947.0, 16786.0, 28739.0, 50335.0, 91130.0, 162063.0, 1281677.0, 188686.0, 108503.0, 60120.0, 33691.0, 19474.0, 11639.0, 7043.0, 4211.0, 2698.0, 1657.0, 1021.0, 604.0, 417.0, 273.0, 154.0, 104.0, 71.0, 36.0, 33.0, 17.0, 16.0, 12.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6572265625, -0.6357803344726562, -0.6143341064453125, -0.5928878784179688, -0.571441650390625, -0.5499954223632812, -0.5285491943359375, -0.5071029663085938, -0.48565673828125, -0.46421051025390625, -0.4427642822265625, -0.42131805419921875, -0.399871826171875, -0.37842559814453125, -0.3569793701171875, -0.33553314208984375, -0.3140869140625, -0.29264068603515625, -0.2711944580078125, -0.24974822998046875, -0.228302001953125, -0.20685577392578125, -0.1854095458984375, -0.16396331787109375, -0.14251708984375, -0.12107086181640625, -0.0996246337890625, -0.07817840576171875, -0.056732177734375, -0.03528594970703125, -0.0138397216796875, 0.00760650634765625, 0.029052734375, 0.05049896240234375, 0.0719451904296875, 0.09339141845703125, 0.114837646484375, 0.13628387451171875, 0.1577301025390625, 0.17917633056640625, 0.20062255859375, 0.22206878662109375, 0.2435150146484375, 0.26496124267578125, 0.286407470703125, 0.30785369873046875, 0.3292999267578125, 0.35074615478515625, 0.3721923828125, 0.39363861083984375, 0.4150848388671875, 0.43653106689453125, 0.457977294921875, 0.47942352294921875, 0.5008697509765625, 0.5223159790039062, 0.54376220703125, 0.5652084350585938, 0.5866546630859375, 0.6081008911132812, 0.629547119140625, 0.6509933471679688, 0.6724395751953125, 0.6938858032226562, 0.71533203125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 7.0, 4.0, 8.0, 11.0, 10.0, 16.0, 16.0, 21.0, 19.0, 25.0, 23.0, 21.0, 38.0, 38.0, 44.0, 35.0, 32.0, 32.0, 46.0, 48.0, 48.0, 47.0, 29.0, 41.0, 49.0, 37.0, 34.0, 29.0, 32.0, 30.0, 25.0, 13.0, 17.0, 17.0, 13.0, 13.0, 10.0, 3.0, 5.0, 5.0, 2.0, 4.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0012235641479492188, -0.0011805891990661621, -0.0011376142501831055, -0.0010946393013000488, -0.0010516643524169922, -0.0010086894035339355, -0.0009657144546508789, -0.0009227395057678223, -0.0008797645568847656, -0.000836789608001709, -0.0007938146591186523, -0.0007508397102355957, -0.0007078647613525391, -0.0006648898124694824, -0.0006219148635864258, -0.0005789399147033691, -0.0005359649658203125, -0.0004929900169372559, -0.0004500150680541992, -0.0004070401191711426, -0.00036406517028808594, -0.0003210902214050293, -0.00027811527252197266, -0.00023514032363891602, -0.00019216537475585938, -0.00014919042587280273, -0.0001062154769897461, -6.324052810668945e-05, -2.0265579223632812e-05, 2.2709369659423828e-05, 6.568431854248047e-05, 0.00010865926742553711, 0.00015163421630859375, 0.0001946091651916504, 0.00023758411407470703, 0.00028055906295776367, 0.0003235340118408203, 0.00036650896072387695, 0.0004094839096069336, 0.00045245885848999023, 0.0004954338073730469, 0.0005384087562561035, 0.0005813837051391602, 0.0006243586540222168, 0.0006673336029052734, 0.0007103085517883301, 0.0007532835006713867, 0.0007962584495544434, 0.0008392333984375, 0.0008822083473205566, 0.0009251832962036133, 0.0009681582450866699, 0.0010111331939697266, 0.0010541081428527832, 0.0010970830917358398, 0.0011400580406188965, 0.0011830329895019531, 0.0012260079383850098, 0.0012689828872680664, 0.001311957836151123, 0.0013549327850341797, 0.0013979077339172363, 0.001440882682800293, 0.0014838576316833496, 0.0015268325805664062]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 9.0, 12.0, 11.0, 8.0, 18.0, 26.0, 30.0, 35.0, 41.0, 58.0, 45.0, 75.0, 115.0, 255.0, 592.0, 1530.0, 458957.0, 583623.0, 1677.0, 599.0, 224.0, 142.0, 103.0, 77.0, 48.0, 46.0, 37.0, 23.0, 31.0, 14.0, 13.0, 12.0, 12.0, 10.0, 9.0, 4.0, 6.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.03399658203125, -0.03299736976623535, -0.0319981575012207, -0.030998945236206055, -0.029999732971191406, -0.029000520706176758, -0.02800130844116211, -0.02700209617614746, -0.026002883911132812, -0.025003671646118164, -0.024004459381103516, -0.023005247116088867, -0.02200603485107422, -0.02100682258605957, -0.020007610321044922, -0.019008398056030273, -0.018009185791015625, -0.017009973526000977, -0.016010761260986328, -0.01501154899597168, -0.014012336730957031, -0.013013124465942383, -0.012013912200927734, -0.011014699935913086, -0.010015487670898438, -0.009016275405883789, -0.00801706314086914, -0.007017850875854492, -0.006018638610839844, -0.005019426345825195, -0.004020214080810547, -0.0030210018157958984, -0.00202178955078125, -0.0010225772857666016, -2.3365020751953125e-05, 0.0009758472442626953, 0.0019750595092773438, 0.002974271774291992, 0.003973484039306641, 0.004972696304321289, 0.0059719085693359375, 0.006971120834350586, 0.007970333099365234, 0.008969545364379883, 0.009968757629394531, 0.01096796989440918, 0.011967182159423828, 0.012966394424438477, 0.013965606689453125, 0.014964818954467773, 0.015964031219482422, 0.01696324348449707, 0.01796245574951172, 0.018961668014526367, 0.019960880279541016, 0.020960092544555664, 0.021959304809570312, 0.02295851707458496, 0.02395772933959961, 0.024956941604614258, 0.025956153869628906, 0.026955366134643555, 0.027954578399658203, 0.02895379066467285, 0.0299530029296875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 50.0, 445.0, 449.0, 64.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.008941203355789185, -0.008775648660957813, -0.008610093966126442, -0.00844453927129507, -0.008278983645141125, -0.008113428950309753, -0.007947874255478382, -0.007782319560647011, -0.0076167648658156395, -0.007451210170984268, -0.00728565501049161, -0.007120100315660238, -0.006954545620828867, -0.006788990925997496, -0.006623435765504837, -0.006457881070673466, -0.006292326375842094, -0.006126771681010723, -0.0059612165205180645, -0.005795661825686693, -0.005630107130855322, -0.005464552436023951, -0.005298997275531292, -0.005133442580699921, -0.004967887420207262, -0.004802332725375891, -0.004636777564883232, -0.004471222870051861, -0.0043056681752204895, -0.004140113480389118, -0.00397455831989646, -0.0038090036250650883, -0.0036434484645724297, -0.0034778935369104147, -0.0033123388420790434, -0.0031467839144170284, -0.002981229219585657, -0.002815674291923642, -0.002650119364261627, -0.002484564669430256, -0.0023190099745988846, -0.0021534550469368696, -0.0019879003521054983, -0.0018223454244434834, -0.001656790729612112, -0.001491235801950097, -0.001325680990703404, -0.0011601261794567108, -0.0009945713682100177, -0.0008290165569633245, -0.0006634617457166314, -0.0004979068762622774, -0.00033235206501558423, -0.0001667972537688911, -1.2423843145370483e-06, 0.00016431242693215609, 0.0003298672381788492, 0.0004954220494255424, 0.0006609768606722355, 0.0008265317301265895, 0.0009920864831656218, 0.0011576414108276367, 0.0013231962220743299, 0.001488751033321023, 0.0016543058445677161]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 4.0, 2.0, 3.0, 4.0, 2.0, 5.0, 8.0, 3.0, 7.0, 5.0, 7.0, 8.0, 19.0, 18.0, 13.0, 27.0, 24.0, 26.0, 23.0, 26.0, 20.0, 32.0, 42.0, 38.0, 36.0, 49.0, 41.0, 41.0, 39.0, 34.0, 32.0, 35.0, 42.0, 28.0, 38.0, 26.0, 22.0, 23.0, 23.0, 15.0, 22.0, 21.0, 14.0, 14.0, 15.0, 8.0, 9.0, 6.0, 6.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007290244102478027, -0.0007045697420835495, -0.0006801150739192963, -0.000655660405755043, -0.0006312057375907898, -0.0006067510694265366, -0.0005822964012622833, -0.0005578417330980301, -0.0005333870649337769, -0.0005089323967695236, -0.0004844777286052704, -0.00046002306044101715, -0.0004355683922767639, -0.0004111137241125107, -0.00038665905594825745, -0.0003622043877840042, -0.000337749719619751, -0.00031329505145549774, -0.0002888403832912445, -0.00026438571512699127, -0.00023993104696273804, -0.0002154763787984848, -0.00019102171063423157, -0.00016656704246997833, -0.0001421123743057251, -0.00011765770614147186, -9.320303797721863e-05, -6.874836981296539e-05, -4.429370164871216e-05, -1.9839033484458923e-05, 4.6156346797943115e-06, 2.9070302844047546e-05, 5.352497100830078e-05, 7.797963917255402e-05, 0.00010243430733680725, 0.00012688897550106049, 0.00015134364366531372, 0.00017579831182956696, 0.0002002529799938202, 0.00022470764815807343, 0.00024916231632232666, 0.0002736169844865799, 0.00029807165265083313, 0.00032252632081508636, 0.0003469809889793396, 0.00037143565714359283, 0.00039589032530784607, 0.0004203449934720993, 0.00044479966163635254, 0.0004692543298006058, 0.000493708997964859, 0.0005181636661291122, 0.0005426183342933655, 0.0005670730024576187, 0.000591527670621872, 0.0006159823387861252, 0.0006404370069503784, 0.0006648916751146317, 0.0006893463432788849, 0.0007138010114431381, 0.0007382556796073914, 0.0007627103477716446, 0.0007871650159358978, 0.0008116196841001511, 0.0008360743522644043]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 2.0, 4.0, 4.0, 8.0, 8.0, 11.0, 10.0, 8.0, 17.0, 12.0, 12.0, 23.0, 35.0, 24.0, 19.0, 25.0, 33.0, 34.0, 35.0, 31.0, 26.0, 37.0, 40.0, 39.0, 35.0, 42.0, 46.0, 27.0, 34.0, 30.0, 25.0, 40.0, 25.0, 20.0, 24.0, 22.0, 20.0, 21.0, 16.0, 14.0, 12.0, 11.0, 7.0, 9.0, 4.0, 7.0, 3.0, 7.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.2734375, -5.10284423828125, -4.9322509765625, -4.76165771484375, -4.591064453125, -4.42047119140625, -4.2498779296875, -4.07928466796875, -3.90869140625, -3.73809814453125, -3.5675048828125, -3.39691162109375, -3.226318359375, -3.05572509765625, -2.8851318359375, -2.71453857421875, -2.5439453125, -2.37335205078125, -2.2027587890625, -2.03216552734375, -1.861572265625, -1.69097900390625, -1.5203857421875, -1.34979248046875, -1.17919921875, -1.00860595703125, -0.8380126953125, -0.66741943359375, -0.496826171875, -0.32623291015625, -0.1556396484375, 0.01495361328125, 0.185546875, 0.35614013671875, 0.5267333984375, 0.69732666015625, 0.867919921875, 1.03851318359375, 1.2091064453125, 1.37969970703125, 1.55029296875, 1.72088623046875, 1.8914794921875, 2.06207275390625, 2.232666015625, 2.40325927734375, 2.5738525390625, 2.74444580078125, 2.9150390625, 3.08563232421875, 3.2562255859375, 3.42681884765625, 3.597412109375, 3.76800537109375, 3.9385986328125, 4.10919189453125, 4.27978515625, 4.45037841796875, 4.6209716796875, 4.79156494140625, 4.962158203125, 5.13275146484375, 5.3033447265625, 5.47393798828125, 5.64453125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 6.0, 15.0, 11.0, 27.0, 30.0, 37.0, 66.0, 105.0, 136.0, 238.0, 357.0, 620.0, 1230.0, 2317.0, 5015.0, 10827.0, 25188.0, 66277.0, 217956.0, 472784.0, 157411.0, 50396.0, 20254.0, 8679.0, 4074.0, 1972.0, 1020.0, 562.0, 334.0, 224.0, 120.0, 76.0, 60.0, 31.0, 36.0, 20.0, 14.0, 13.0, 6.0, 3.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.734375, -4.5614013671875, -4.388427734375, -4.2154541015625, -4.04248046875, -3.8695068359375, -3.696533203125, -3.5235595703125, -3.3505859375, -3.1776123046875, -3.004638671875, -2.8316650390625, -2.65869140625, -2.4857177734375, -2.312744140625, -2.1397705078125, -1.966796875, -1.7938232421875, -1.620849609375, -1.4478759765625, -1.27490234375, -1.1019287109375, -0.928955078125, -0.7559814453125, -0.5830078125, -0.4100341796875, -0.237060546875, -0.0640869140625, 0.10888671875, 0.2818603515625, 0.454833984375, 0.6278076171875, 0.80078125, 0.9737548828125, 1.146728515625, 1.3197021484375, 1.49267578125, 1.6656494140625, 1.838623046875, 2.0115966796875, 2.1845703125, 2.3575439453125, 2.530517578125, 2.7034912109375, 2.87646484375, 3.0494384765625, 3.222412109375, 3.3953857421875, 3.568359375, 3.7413330078125, 3.914306640625, 4.0872802734375, 4.26025390625, 4.4332275390625, 4.606201171875, 4.7791748046875, 4.9521484375, 5.1251220703125, 5.298095703125, 5.4710693359375, 5.64404296875, 5.8170166015625, 5.989990234375, 6.1629638671875, 6.3359375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 5.0, 2.0, 9.0, 13.0, 11.0, 21.0, 15.0, 22.0, 17.0, 23.0, 25.0, 35.0, 38.0, 50.0, 42.0, 40.0, 68.0, 153.0, 1474.0, 393.0, 139.0, 64.0, 58.0, 55.0, 48.0, 34.0, 26.0, 32.0, 18.0, 21.0, 18.0, 17.0, 7.0, 9.0, 5.0, 7.0, 9.0, 8.0, 3.0, 8.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.671875, -20.9716796875, -20.271484375, -19.5712890625, -18.87109375, -18.1708984375, -17.470703125, -16.7705078125, -16.0703125, -15.3701171875, -14.669921875, -13.9697265625, -13.26953125, -12.5693359375, -11.869140625, -11.1689453125, -10.46875, -9.7685546875, -9.068359375, -8.3681640625, -7.66796875, -6.9677734375, -6.267578125, -5.5673828125, -4.8671875, -4.1669921875, -3.466796875, -2.7666015625, -2.06640625, -1.3662109375, -0.666015625, 0.0341796875, 0.734375, 1.4345703125, 2.134765625, 2.8349609375, 3.53515625, 4.2353515625, 4.935546875, 5.6357421875, 6.3359375, 7.0361328125, 7.736328125, 8.4365234375, 9.13671875, 9.8369140625, 10.537109375, 11.2373046875, 11.9375, 12.6376953125, 13.337890625, 14.0380859375, 14.73828125, 15.4384765625, 16.138671875, 16.8388671875, 17.5390625, 18.2392578125, 18.939453125, 19.6396484375, 20.33984375, 21.0400390625, 21.740234375, 22.4404296875, 23.140625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 10.0, 3.0, 9.0, 12.0, 11.0, 19.0, 19.0, 22.0, 42.0, 44.0, 83.0, 79.0, 107.0, 147.0, 270.0, 424.0, 941.0, 11865.0, 3091105.0, 37759.0, 1327.0, 446.0, 255.0, 191.0, 108.0, 102.0, 61.0, 57.0, 34.0, 42.0, 30.0, 23.0, 13.0, 13.0, 8.0, 9.0, 6.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.46875, -49.73046875, -47.9921875, -46.25390625, -44.515625, -42.77734375, -41.0390625, -39.30078125, -37.5625, -35.82421875, -34.0859375, -32.34765625, -30.609375, -28.87109375, -27.1328125, -25.39453125, -23.65625, -21.91796875, -20.1796875, -18.44140625, -16.703125, -14.96484375, -13.2265625, -11.48828125, -9.75, -8.01171875, -6.2734375, -4.53515625, -2.796875, -1.05859375, 0.6796875, 2.41796875, 4.15625, 5.89453125, 7.6328125, 9.37109375, 11.109375, 12.84765625, 14.5859375, 16.32421875, 18.0625, 19.80078125, 21.5390625, 23.27734375, 25.015625, 26.75390625, 28.4921875, 30.23046875, 31.96875, 33.70703125, 35.4453125, 37.18359375, 38.921875, 40.66015625, 42.3984375, 44.13671875, 45.875, 47.61328125, 49.3515625, 51.08984375, 52.828125, 54.56640625, 56.3046875, 58.04296875, 59.78125]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 10.0, 24.0, 68.0, 116.0, 181.0, 221.0, 181.0, 110.0, 61.0, 18.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.17922592163086, -50.85853576660156, -49.537845611572266, -48.21715545654297, -46.89646911621094, -45.57577896118164, -44.255088806152344, -42.93439865112305, -41.61370849609375, -40.29301834106445, -38.972328186035156, -37.65163803100586, -36.33094787597656, -35.01026153564453, -33.689571380615234, -32.36888122558594, -31.04819107055664, -29.727500915527344, -28.406810760498047, -27.086122512817383, -25.765432357788086, -24.44474220275879, -23.124053955078125, -21.803363800048828, -20.48267364501953, -19.161983489990234, -17.841293334960938, -16.520605087280273, -15.199914932250977, -13.87922477722168, -12.5585355758667, -11.237846374511719, -9.917156219482422, -8.596466064453125, -7.2757768630981445, -5.955087184906006, -4.634397506713867, -3.3137078285217285, -1.9930181503295898, -0.6723289489746094, 0.6483612060546875, 1.9690508842468262, 3.289740562438965, 4.6104302406311035, 5.931119918823242, 7.251809597015381, 8.57249927520752, 9.8931884765625, 11.213878631591797, 12.534568786621094, 13.855257987976074, 15.175947189331055, 16.49663734436035, 17.81732749938965, 19.138015747070312, 20.45870590209961, 21.779396057128906, 23.100086212158203, 24.4207763671875, 25.741464614868164, 27.06215476989746, 28.382844924926758, 29.703533172607422, 31.02422332763672, 32.344913482666016]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 2.0, 4.0, 6.0, 6.0, 18.0, 12.0, 11.0, 17.0, 15.0, 20.0, 31.0, 26.0, 43.0, 35.0, 42.0, 34.0, 48.0, 67.0, 40.0, 53.0, 43.0, 47.0, 49.0, 41.0, 38.0, 30.0, 34.0, 18.0, 30.0, 28.0, 17.0, 27.0, 18.0, 14.0, 6.0, 8.0, 8.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.7752685546875, -58.70700454711914, -56.63874435424805, -54.57048034667969, -52.50221633911133, -50.43395233154297, -48.365692138671875, -46.297428131103516, -44.229164123535156, -42.1609001159668, -40.0926399230957, -38.024375915527344, -35.956111907958984, -33.887847900390625, -31.81958770751953, -29.751323699951172, -27.683063507080078, -25.61480140686035, -23.546537399291992, -21.478275299072266, -19.410011291503906, -17.34174919128418, -15.273487091064453, -13.20522403717041, -11.136960983276367, -9.068697929382324, -7.0004353523254395, -4.932172775268555, -2.8639097213745117, -0.7956466674804688, 1.2726154327392578, 3.340878486633301, 5.409141540527344, 7.477404594421387, 9.54566764831543, 11.613929748535156, 13.6821928024292, 15.750455856323242, 17.81871795654297, 19.886981964111328, 21.955244064331055, 24.02350616455078, 26.09177017211914, 28.160032272338867, 30.228294372558594, 32.29655838012695, 34.36482238769531, 36.433082580566406, 38.501346588134766, 40.569610595703125, 42.63787078857422, 44.70613479614258, 46.77439880371094, 48.84265899658203, 50.91092300415039, 52.97918701171875, 55.047447204589844, 57.1157112121582, 59.1839714050293, 61.252235412597656, 63.320499420166016, 65.38876342773438, 67.45702362060547, 69.52528381347656, 71.59355163574219]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 6.0, 4.0, 0.0, 3.0, 5.0, 6.0, 8.0, 11.0, 9.0, 16.0, 11.0, 16.0, 13.0, 15.0, 31.0, 27.0, 22.0, 29.0, 32.0, 25.0, 37.0, 32.0, 43.0, 26.0, 40.0, 33.0, 43.0, 39.0, 44.0, 28.0, 29.0, 36.0, 31.0, 30.0, 20.0, 30.0, 21.0, 19.0, 24.0, 20.0, 10.0, 16.0, 17.0, 7.0, 13.0, 4.0, 6.0, 6.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.98046875, -5.79827880859375, -5.6160888671875, -5.43389892578125, -5.251708984375, -5.06951904296875, -4.8873291015625, -4.70513916015625, -4.52294921875, -4.34075927734375, -4.1585693359375, -3.97637939453125, -3.794189453125, -3.61199951171875, -3.4298095703125, -3.24761962890625, -3.0654296875, -2.88323974609375, -2.7010498046875, -2.51885986328125, -2.336669921875, -2.15447998046875, -1.9722900390625, -1.79010009765625, -1.60791015625, -1.42572021484375, -1.2435302734375, -1.06134033203125, -0.879150390625, -0.69696044921875, -0.5147705078125, -0.33258056640625, -0.150390625, 0.03179931640625, 0.2139892578125, 0.39617919921875, 0.578369140625, 0.76055908203125, 0.9427490234375, 1.12493896484375, 1.30712890625, 1.48931884765625, 1.6715087890625, 1.85369873046875, 2.035888671875, 2.21807861328125, 2.4002685546875, 2.58245849609375, 2.7646484375, 2.94683837890625, 3.1290283203125, 3.31121826171875, 3.493408203125, 3.67559814453125, 3.8577880859375, 4.03997802734375, 4.22216796875, 4.40435791015625, 4.5865478515625, 4.76873779296875, 4.950927734375, 5.13311767578125, 5.3153076171875, 5.49749755859375, 5.6796875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 2.0, 2.0, 3.0, 8.0, 6.0, 11.0, 15.0, 11.0, 18.0, 15.0, 18.0, 17.0, 26.0, 24.0, 34.0, 30.0, 68.0, 134.0, 315.0, 1042.0, 6090.0, 112713.0, 2851848.0, 1190673.0, 27330.0, 2636.0, 628.0, 186.0, 75.0, 39.0, 38.0, 30.0, 15.0, 29.0, 20.0, 17.0, 19.0, 20.0, 12.0, 12.0, 8.0, 7.0, 12.0, 1.0, 6.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.234375, -20.566650390625, -19.89892578125, -19.231201171875, -18.5634765625, -17.895751953125, -17.22802734375, -16.560302734375, -15.892578125, -15.224853515625, -14.55712890625, -13.889404296875, -13.2216796875, -12.553955078125, -11.88623046875, -11.218505859375, -10.55078125, -9.883056640625, -9.21533203125, -8.547607421875, -7.8798828125, -7.212158203125, -6.54443359375, -5.876708984375, -5.208984375, -4.541259765625, -3.87353515625, -3.205810546875, -2.5380859375, -1.870361328125, -1.20263671875, -0.534912109375, 0.1328125, 0.800537109375, 1.46826171875, 2.135986328125, 2.8037109375, 3.471435546875, 4.13916015625, 4.806884765625, 5.474609375, 6.142333984375, 6.81005859375, 7.477783203125, 8.1455078125, 8.813232421875, 9.48095703125, 10.148681640625, 10.81640625, 11.484130859375, 12.15185546875, 12.819580078125, 13.4873046875, 14.155029296875, 14.82275390625, 15.490478515625, 16.158203125, 16.825927734375, 17.49365234375, 18.161376953125, 18.8291015625, 19.496826171875, 20.16455078125, 20.832275390625, 21.5]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 4.0, 4.0, 9.0, 17.0, 16.0, 28.0, 29.0, 38.0, 47.0, 101.0, 119.0, 177.0, 211.0, 284.0, 367.0, 475.0, 452.0, 431.0, 344.0, 255.0, 190.0, 125.0, 104.0, 76.0, 57.0, 31.0, 17.0, 19.0, 18.0, 14.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.3984375, -13.98876953125, -13.5791015625, -13.16943359375, -12.759765625, -12.35009765625, -11.9404296875, -11.53076171875, -11.12109375, -10.71142578125, -10.3017578125, -9.89208984375, -9.482421875, -9.07275390625, -8.6630859375, -8.25341796875, -7.84375, -7.43408203125, -7.0244140625, -6.61474609375, -6.205078125, -5.79541015625, -5.3857421875, -4.97607421875, -4.56640625, -4.15673828125, -3.7470703125, -3.33740234375, -2.927734375, -2.51806640625, -2.1083984375, -1.69873046875, -1.2890625, -0.87939453125, -0.4697265625, -0.06005859375, 0.349609375, 0.75927734375, 1.1689453125, 1.57861328125, 1.98828125, 2.39794921875, 2.8076171875, 3.21728515625, 3.626953125, 4.03662109375, 4.4462890625, 4.85595703125, 5.265625, 5.67529296875, 6.0849609375, 6.49462890625, 6.904296875, 7.31396484375, 7.7236328125, 8.13330078125, 8.54296875, 8.95263671875, 9.3623046875, 9.77197265625, 10.181640625, 10.59130859375, 11.0009765625, 11.41064453125, 11.8203125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 7.0, 4.0, 4.0, 10.0, 11.0, 16.0, 26.0, 25.0, 28.0, 43.0, 38.0, 80.0, 110.0, 146.0, 182.0, 241.0, 389.0, 631.0, 2793.0, 163786.0, 3967995.0, 54178.0, 1789.0, 510.0, 311.0, 222.0, 167.0, 133.0, 98.0, 71.0, 55.0, 48.0, 40.0, 29.0, 19.0, 14.0, 14.0, 9.0, 5.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.4375, -36.9814453125, -35.525390625, -34.0693359375, -32.61328125, -31.1572265625, -29.701171875, -28.2451171875, -26.7890625, -25.3330078125, -23.876953125, -22.4208984375, -20.96484375, -19.5087890625, -18.052734375, -16.5966796875, -15.140625, -13.6845703125, -12.228515625, -10.7724609375, -9.31640625, -7.8603515625, -6.404296875, -4.9482421875, -3.4921875, -2.0361328125, -0.580078125, 0.8759765625, 2.33203125, 3.7880859375, 5.244140625, 6.7001953125, 8.15625, 9.6123046875, 11.068359375, 12.5244140625, 13.98046875, 15.4365234375, 16.892578125, 18.3486328125, 19.8046875, 21.2607421875, 22.716796875, 24.1728515625, 25.62890625, 27.0849609375, 28.541015625, 29.9970703125, 31.453125, 32.9091796875, 34.365234375, 35.8212890625, 37.27734375, 38.7333984375, 40.189453125, 41.6455078125, 43.1015625, 44.5576171875, 46.013671875, 47.4697265625, 48.92578125, 50.3818359375, 51.837890625, 53.2939453125, 54.75]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 22.0, 58.0, 171.0, 259.0, 247.0, 173.0, 65.0, 14.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.51522827148438, -144.6968994140625, -140.87857055664062, -137.06024169921875, -133.24191284179688, -129.423583984375, -125.60525512695312, -121.78692626953125, -117.96859741210938, -114.1502685546875, -110.33193969726562, -106.51361083984375, -102.69528198242188, -98.876953125, -95.05862426757812, -91.24029541015625, -87.4219741821289, -83.60364532470703, -79.78531646728516, -75.96698760986328, -72.1486587524414, -68.33032989501953, -64.51200866699219, -60.69367599487305, -56.87534713745117, -53.0570182800293, -49.23868942260742, -45.42036437988281, -41.60203552246094, -37.78370666503906, -33.96537780761719, -30.147048950195312, -26.328712463378906, -22.51038360595703, -18.692054748535156, -14.873727798461914, -11.055398941040039, -7.237070083618164, -3.418743133544922, 0.3995857238769531, 4.217914581298828, 8.036243438720703, 11.854571342468262, 15.67289924621582, 19.491228103637695, 23.30955696105957, 27.127883911132812, 30.946212768554688, 34.76454162597656, 38.58287048339844, 42.40119934082031, 46.21952819824219, 50.03785705566406, 53.85618591308594, 57.67451095581055, 61.49283981323242, 65.31117248535156, 69.12950134277344, 72.94783020019531, 76.76615905761719, 80.58448791503906, 84.40281677246094, 88.22114562988281, 92.03947448730469, 95.85779571533203]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 5.0, 8.0, 10.0, 9.0, 10.0, 7.0, 11.0, 18.0, 19.0, 23.0, 16.0, 23.0, 28.0, 24.0, 28.0, 35.0, 35.0, 36.0, 37.0, 36.0, 36.0, 41.0, 42.0, 43.0, 45.0, 39.0, 37.0, 32.0, 32.0, 27.0, 24.0, 21.0, 12.0, 19.0, 28.0, 18.0, 13.0, 8.0, 15.0, 13.0, 13.0, 6.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.14024353027344, -36.944583892822266, -35.74892044067383, -34.553260803222656, -33.35759735107422, -32.16193771362305, -30.966276168823242, -29.770614624023438, -28.574953079223633, -27.379291534423828, -26.183629989624023, -24.98796844482422, -23.792308807373047, -22.59664535522461, -21.400985717773438, -20.205324172973633, -19.009662628173828, -17.814001083374023, -16.61833953857422, -15.42267894744873, -14.227017402648926, -13.031355857849121, -11.835695266723633, -10.640033721923828, -9.444372177124023, -8.248710632324219, -7.053049564361572, -5.857388496398926, -4.661726951599121, -3.4660654067993164, -2.27040433883667, -1.0747432708740234, 0.12091827392578125, 1.3165795803070068, 2.5122408866882324, 3.707902193069458, 4.903563499450684, 6.099225044250488, 7.294886112213135, 8.490547180175781, 9.686208724975586, 10.88187026977539, 12.077531814575195, 13.273192405700684, 14.468853950500488, 15.664515495300293, 16.86017608642578, 18.055837631225586, 19.25149917602539, 20.447160720825195, 21.642822265625, 22.838483810424805, 24.03414535522461, 25.22980499267578, 26.425466537475586, 27.62112808227539, 28.816789627075195, 30.012451171875, 31.208112716674805, 32.40377426147461, 33.59943389892578, 34.79509735107422, 35.99075698852539, 37.18641662597656, 38.382080078125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 1.0, 6.0, 3.0, 6.0, 6.0, 4.0, 10.0, 3.0, 10.0, 8.0, 12.0, 15.0, 14.0, 13.0, 15.0, 27.0, 25.0, 26.0, 38.0, 18.0, 42.0, 30.0, 35.0, 33.0, 47.0, 40.0, 28.0, 29.0, 34.0, 33.0, 42.0, 31.0, 36.0, 32.0, 29.0, 23.0, 31.0, 23.0, 27.0, 13.0, 15.0, 12.0, 20.0, 13.0, 8.0, 7.0, 3.0, 9.0, 6.0, 6.0, 2.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.21484375, -5.04010009765625, -4.8653564453125, -4.69061279296875, -4.515869140625, -4.34112548828125, -4.1663818359375, -3.99163818359375, -3.81689453125, -3.64215087890625, -3.4674072265625, -3.29266357421875, -3.117919921875, -2.94317626953125, -2.7684326171875, -2.59368896484375, -2.4189453125, -2.24420166015625, -2.0694580078125, -1.89471435546875, -1.719970703125, -1.54522705078125, -1.3704833984375, -1.19573974609375, -1.02099609375, -0.84625244140625, -0.6715087890625, -0.49676513671875, -0.322021484375, -0.14727783203125, 0.0274658203125, 0.20220947265625, 0.376953125, 0.55169677734375, 0.7264404296875, 0.90118408203125, 1.075927734375, 1.25067138671875, 1.4254150390625, 1.60015869140625, 1.77490234375, 1.94964599609375, 2.1243896484375, 2.29913330078125, 2.473876953125, 2.64862060546875, 2.8233642578125, 2.99810791015625, 3.1728515625, 3.34759521484375, 3.5223388671875, 3.69708251953125, 3.871826171875, 4.04656982421875, 4.2213134765625, 4.39605712890625, 4.57080078125, 4.74554443359375, 4.9202880859375, 5.09503173828125, 5.269775390625, 5.44451904296875, 5.6192626953125, 5.79400634765625, 5.96875]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 11.0, 6.0, 6.0, 20.0, 31.0, 52.0, 69.0, 85.0, 165.0, 218.0, 377.0, 552.0, 855.0, 1391.0, 2201.0, 3707.0, 5836.0, 9866.0, 17101.0, 29566.0, 53616.0, 104182.0, 201989.0, 262746.0, 165627.0, 83737.0, 44013.0, 24607.0, 14103.0, 8285.0, 5189.0, 3123.0, 1897.0, 1232.0, 724.0, 498.0, 310.0, 213.0, 103.0, 91.0, 58.0, 46.0, 19.0, 15.0, 8.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.755859375, -0.72918701171875, -0.7025146484375, -0.67584228515625, -0.649169921875, -0.62249755859375, -0.5958251953125, -0.56915283203125, -0.54248046875, -0.51580810546875, -0.4891357421875, -0.46246337890625, -0.435791015625, -0.40911865234375, -0.3824462890625, -0.35577392578125, -0.3291015625, -0.30242919921875, -0.2757568359375, -0.24908447265625, -0.222412109375, -0.19573974609375, -0.1690673828125, -0.14239501953125, -0.11572265625, -0.08905029296875, -0.0623779296875, -0.03570556640625, -0.009033203125, 0.01763916015625, 0.0443115234375, 0.07098388671875, 0.09765625, 0.12432861328125, 0.1510009765625, 0.17767333984375, 0.204345703125, 0.23101806640625, 0.2576904296875, 0.28436279296875, 0.31103515625, 0.33770751953125, 0.3643798828125, 0.39105224609375, 0.417724609375, 0.44439697265625, 0.4710693359375, 0.49774169921875, 0.5244140625, 0.55108642578125, 0.5777587890625, 0.60443115234375, 0.631103515625, 0.65777587890625, 0.6844482421875, 0.71112060546875, 0.73779296875, 0.76446533203125, 0.7911376953125, 0.81781005859375, 0.844482421875, 0.87115478515625, 0.8978271484375, 0.92449951171875, 0.951171875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 10.0, 5.0, 6.0, 7.0, 7.0, 12.0, 14.0, 9.0, 16.0, 16.0, 21.0, 26.0, 30.0, 31.0, 18.0, 36.0, 24.0, 36.0, 44.0, 42.0, 33.0, 29.0, 1061.0, 33.0, 50.0, 34.0, 33.0, 38.0, 29.0, 33.0, 32.0, 30.0, 17.0, 29.0, 16.0, 16.0, 21.0, 8.0, 12.0, 12.0, 6.0, 6.0, 12.0, 7.0, 7.0, 4.0, 4.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0], "bins": [-3.724609375, -3.609344482421875, -3.49407958984375, -3.378814697265625, -3.2635498046875, -3.148284912109375, -3.03302001953125, -2.917755126953125, -2.802490234375, -2.687225341796875, -2.57196044921875, -2.456695556640625, -2.3414306640625, -2.226165771484375, -2.11090087890625, -1.995635986328125, -1.88037109375, -1.765106201171875, -1.64984130859375, -1.534576416015625, -1.4193115234375, -1.304046630859375, -1.18878173828125, -1.073516845703125, -0.958251953125, -0.842987060546875, -0.72772216796875, -0.612457275390625, -0.4971923828125, -0.381927490234375, -0.26666259765625, -0.151397705078125, -0.0361328125, 0.079132080078125, 0.19439697265625, 0.309661865234375, 0.4249267578125, 0.540191650390625, 0.65545654296875, 0.770721435546875, 0.885986328125, 1.001251220703125, 1.11651611328125, 1.231781005859375, 1.3470458984375, 1.462310791015625, 1.57757568359375, 1.692840576171875, 1.80810546875, 1.923370361328125, 2.03863525390625, 2.153900146484375, 2.2691650390625, 2.384429931640625, 2.49969482421875, 2.614959716796875, 2.730224609375, 2.845489501953125, 2.96075439453125, 3.076019287109375, 3.1912841796875, 3.306549072265625, 3.42181396484375, 3.537078857421875, 3.65234375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 5.0, 15.0, 11.0, 23.0, 47.0, 38.0, 63.0, 100.0, 172.0, 243.0, 382.0, 603.0, 842.0, 1369.0, 2084.0, 3107.0, 4898.0, 7353.0, 11442.0, 17463.0, 27944.0, 44255.0, 72290.0, 117927.0, 175734.0, 1237514.0, 139238.0, 86718.0, 53181.0, 32987.0, 20641.0, 13115.0, 8664.0, 5671.0, 3802.0, 2438.0, 1578.0, 1023.0, 745.0, 458.0, 314.0, 213.0, 135.0, 78.0, 61.0, 46.0, 36.0, 13.0, 16.0, 10.0, 6.0, 9.0, 4.0, 1.0, 1.0, 4.0], "bins": [-0.6279296875, -0.6090087890625, -0.590087890625, -0.5711669921875, -0.55224609375, -0.5333251953125, -0.514404296875, -0.4954833984375, -0.4765625, -0.4576416015625, -0.438720703125, -0.4197998046875, -0.40087890625, -0.3819580078125, -0.363037109375, -0.3441162109375, -0.3251953125, -0.3062744140625, -0.287353515625, -0.2684326171875, -0.24951171875, -0.2305908203125, -0.211669921875, -0.1927490234375, -0.173828125, -0.1549072265625, -0.135986328125, -0.1170654296875, -0.09814453125, -0.0792236328125, -0.060302734375, -0.0413818359375, -0.0224609375, -0.0035400390625, 0.015380859375, 0.0343017578125, 0.05322265625, 0.0721435546875, 0.091064453125, 0.1099853515625, 0.12890625, 0.1478271484375, 0.166748046875, 0.1856689453125, 0.20458984375, 0.2235107421875, 0.242431640625, 0.2613525390625, 0.2802734375, 0.2991943359375, 0.318115234375, 0.3370361328125, 0.35595703125, 0.3748779296875, 0.393798828125, 0.4127197265625, 0.431640625, 0.4505615234375, 0.469482421875, 0.4884033203125, 0.50732421875, 0.5262451171875, 0.545166015625, 0.5640869140625, 0.5830078125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 4.0, 3.0, 10.0, 18.0, 12.0, 16.0, 15.0, 22.0, 26.0, 19.0, 36.0, 29.0, 50.0, 54.0, 46.0, 58.0, 47.0, 53.0, 58.0, 61.0, 44.0, 51.0, 43.0, 32.0, 23.0, 29.0, 30.0, 18.0, 20.0, 11.0, 13.0, 13.0, 8.0, 13.0, 1.0, 2.0, 5.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016813278198242188, -0.001618310809135437, -0.0015552937984466553, -0.0014922767877578735, -0.0014292597770690918, -0.00136624276638031, -0.0013032257556915283, -0.0012402087450027466, -0.0011771917343139648, -0.001114174723625183, -0.0010511577129364014, -0.0009881407022476196, -0.0009251236915588379, -0.0008621066808700562, -0.0007990896701812744, -0.0007360726594924927, -0.0006730556488037109, -0.0006100386381149292, -0.0005470216274261475, -0.0004840046167373657, -0.000420987606048584, -0.00035797059535980225, -0.0002949535846710205, -0.00023193657398223877, -0.00016891956329345703, -0.00010590255260467529, -4.2885541915893555e-05, 2.0131468772888184e-05, 8.314847946166992e-05, 0.00014616549015045166, 0.0002091825008392334, 0.00027219951152801514, 0.0003352165222167969, 0.0003982335329055786, 0.00046125054359436035, 0.0005242675542831421, 0.0005872845649719238, 0.0006503015756607056, 0.0007133185863494873, 0.000776335597038269, 0.0008393526077270508, 0.0009023696184158325, 0.0009653866291046143, 0.001028403639793396, 0.0010914206504821777, 0.0011544376611709595, 0.0012174546718597412, 0.001280471682548523, 0.0013434886932373047, 0.0014065057039260864, 0.0014695227146148682, 0.00153253972530365, 0.0015955567359924316, 0.0016585737466812134, 0.0017215907573699951, 0.0017846077680587769, 0.0018476247787475586, 0.0019106417894363403, 0.001973658800125122, 0.002036675810813904, 0.0020996928215026855, 0.0021627098321914673, 0.002225726842880249, 0.0022887438535690308, 0.0023517608642578125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 8.0, 2.0, 5.0, 13.0, 14.0, 17.0, 14.0, 15.0, 14.0, 39.0, 36.0, 48.0, 47.0, 63.0, 94.0, 135.0, 321.0, 771.0, 4474.0, 1033018.0, 7571.0, 857.0, 338.0, 165.0, 89.0, 95.0, 56.0, 51.0, 27.0, 32.0, 17.0, 22.0, 15.0, 12.0, 12.0, 10.0, 10.0, 4.0, 8.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0], "bins": [-0.0484619140625, -0.04717111587524414, -0.04588031768798828, -0.04458951950073242, -0.04329872131347656, -0.0420079231262207, -0.040717124938964844, -0.039426326751708984, -0.038135528564453125, -0.036844730377197266, -0.035553932189941406, -0.03426313400268555, -0.03297233581542969, -0.03168153762817383, -0.03039073944091797, -0.02909994125366211, -0.02780914306640625, -0.02651834487915039, -0.02522754669189453, -0.023936748504638672, -0.022645950317382812, -0.021355152130126953, -0.020064353942871094, -0.018773555755615234, -0.017482757568359375, -0.016191959381103516, -0.014901161193847656, -0.013610363006591797, -0.012319564819335938, -0.011028766632080078, -0.009737968444824219, -0.00844717025756836, -0.0071563720703125, -0.005865573883056641, -0.004574775695800781, -0.003283977508544922, -0.0019931793212890625, -0.0007023811340332031, 0.0005884170532226562, 0.0018792152404785156, 0.003170013427734375, 0.004460811614990234, 0.005751609802246094, 0.007042407989501953, 0.008333206176757812, 0.009624004364013672, 0.010914802551269531, 0.01220560073852539, 0.01349639892578125, 0.01478719711303711, 0.01607799530029297, 0.017368793487548828, 0.018659591674804688, 0.019950389862060547, 0.021241188049316406, 0.022531986236572266, 0.023822784423828125, 0.025113582611083984, 0.026404380798339844, 0.027695178985595703, 0.028985977172851562, 0.030276775360107422, 0.03156757354736328, 0.03285837173461914, 0.034149169921875]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 13.0, 571.0, 426.0, 5.0, 3.0, 0.0, 1.0], "bins": [-0.018662385642528534, -0.018345650285482407, -0.01802891492843628, -0.017712179571390152, -0.017395444214344025, -0.017078708857297897, -0.01676197536289692, -0.016445240005850792, -0.016128504648804665, -0.015811769291758537, -0.01549503393471241, -0.015178299508988857, -0.01486156415194273, -0.014544828794896603, -0.014228093437850475, -0.013911358080804348, -0.01359462272375822, -0.013277887366712093, -0.012961152009665966, -0.012644417583942413, -0.012327682226896286, -0.012010946869850159, -0.011694211512804031, -0.011377476155757904, -0.011060740798711777, -0.01074400544166565, -0.010427270084619522, -0.01011053565889597, -0.009793800301849842, -0.009477064944803715, -0.009160329587757587, -0.00884359423071146, -0.008526858873665333, -0.008210123516619205, -0.007893388159573078, -0.007576653268188238, -0.007259918376803398, -0.006943183019757271, -0.0066264476627111435, -0.006309712305665016, -0.0059929778799414635, -0.005676242522895336, -0.005359507631510496, -0.005042772274464369, -0.004726037383079529, -0.0044093020260334015, -0.004092566668987274, -0.0037758315447717905, -0.003459096187725663, -0.0031423610635101795, -0.002825625706464052, -0.0025088905822485685, -0.002192155458033085, -0.0018754203338176012, -0.0015586850931867957, -0.0012419498525559902, -0.0009252147283405066, -0.000608479545917362, -0.0002917443634942174, 2.4990818928927183e-05, 0.00034172600135207176, 0.0006584611255675554, 0.0009751963661983609, 0.0012919316068291664, 0.00160866673104465]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 6.0, 11.0, 3.0, 5.0, 6.0, 6.0, 17.0, 22.0, 14.0, 18.0, 19.0, 25.0, 28.0, 29.0, 37.0, 37.0, 24.0, 44.0, 48.0, 49.0, 52.0, 44.0, 47.0, 33.0, 28.0, 42.0, 42.0, 36.0, 31.0, 24.0, 20.0, 25.0, 23.0, 22.0, 21.0, 15.0, 14.0, 12.0, 7.0, 4.0, 3.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0011348724365234375, -0.0011007599532604218, -0.001066647469997406, -0.0010325349867343903, -0.0009984225034713745, -0.0009643100202083588, -0.000930197536945343, -0.0008960850536823273, -0.0008619725704193115, -0.0008278600871562958, -0.00079374760389328, -0.0007596351206302643, -0.0007255226373672485, -0.0006914101541042328, -0.000657297670841217, -0.0006231851875782013, -0.0005890727043151855, -0.0005549602210521698, -0.000520847737789154, -0.0004867352545261383, -0.00045262277126312256, -0.0004185102880001068, -0.00038439780473709106, -0.0003502853214740753, -0.00031617283821105957, -0.0002820603549480438, -0.0002479478716850281, -0.00021383538842201233, -0.00017972290515899658, -0.00014561042189598083, -0.00011149793863296509, -7.738545536994934e-05, -4.3272972106933594e-05, -9.160488843917847e-06, 2.49519944190979e-05, 5.906447768211365e-05, 9.31769609451294e-05, 0.00012728944420814514, 0.0001614019274711609, 0.00019551441073417664, 0.00022962689399719238, 0.00026373937726020813, 0.0002978518605232239, 0.0003319643437862396, 0.00036607682704925537, 0.0004001893103122711, 0.00043430179357528687, 0.0004684142768383026, 0.0005025267601013184, 0.0005366392433643341, 0.0005707517266273499, 0.0006048642098903656, 0.0006389766931533813, 0.0006730891764163971, 0.0007072016596794128, 0.0007413141429424286, 0.0007754266262054443, 0.0008095391094684601, 0.0008436515927314758, 0.0008777640759944916, 0.0009118765592575073, 0.0009459890425205231, 0.0009801015257835388, 0.0010142140090465546, 0.0010483264923095703]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 1.0, 6.0, 3.0, 6.0, 6.0, 4.0, 10.0, 3.0, 10.0, 8.0, 12.0, 15.0, 14.0, 13.0, 15.0, 26.0, 25.0, 27.0, 35.0, 21.0, 42.0, 29.0, 36.0, 32.0, 47.0, 41.0, 28.0, 29.0, 33.0, 34.0, 41.0, 32.0, 36.0, 32.0, 29.0, 23.0, 30.0, 24.0, 26.0, 12.0, 17.0, 12.0, 20.0, 13.0, 8.0, 7.0, 3.0, 9.0, 6.0, 6.0, 2.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.21875, -5.0439453125, -4.869140625, -4.6943359375, -4.51953125, -4.3447265625, -4.169921875, -3.9951171875, -3.8203125, -3.6455078125, -3.470703125, -3.2958984375, -3.12109375, -2.9462890625, -2.771484375, -2.5966796875, -2.421875, -2.2470703125, -2.072265625, -1.8974609375, -1.72265625, -1.5478515625, -1.373046875, -1.1982421875, -1.0234375, -0.8486328125, -0.673828125, -0.4990234375, -0.32421875, -0.1494140625, 0.025390625, 0.2001953125, 0.375, 0.5498046875, 0.724609375, 0.8994140625, 1.07421875, 1.2490234375, 1.423828125, 1.5986328125, 1.7734375, 1.9482421875, 2.123046875, 2.2978515625, 2.47265625, 2.6474609375, 2.822265625, 2.9970703125, 3.171875, 3.3466796875, 3.521484375, 3.6962890625, 3.87109375, 4.0458984375, 4.220703125, 4.3955078125, 4.5703125, 4.7451171875, 4.919921875, 5.0947265625, 5.26953125, 5.4443359375, 5.619140625, 5.7939453125, 5.96875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 12.0, 16.0, 28.0, 25.0, 35.0, 44.0, 58.0, 94.0, 110.0, 121.0, 199.0, 270.0, 401.0, 603.0, 951.0, 1435.0, 2290.0, 3652.0, 6249.0, 11147.0, 21415.0, 46516.0, 116763.0, 318122.0, 310137.0, 113752.0, 45787.0, 21111.0, 10965.0, 6088.0, 3535.0, 2159.0, 1463.0, 990.0, 588.0, 417.0, 261.0, 175.0, 144.0, 108.0, 84.0, 70.0, 52.0, 31.0, 17.0, 22.0, 15.0, 15.0, 5.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.708984375, -3.585296630859375, -3.46160888671875, -3.337921142578125, -3.2142333984375, -3.090545654296875, -2.96685791015625, -2.843170166015625, -2.719482421875, -2.595794677734375, -2.47210693359375, -2.348419189453125, -2.2247314453125, -2.101043701171875, -1.97735595703125, -1.853668212890625, -1.72998046875, -1.606292724609375, -1.48260498046875, -1.358917236328125, -1.2352294921875, -1.111541748046875, -0.98785400390625, -0.864166259765625, -0.740478515625, -0.616790771484375, -0.49310302734375, -0.369415283203125, -0.2457275390625, -0.122039794921875, 0.00164794921875, 0.125335693359375, 0.2490234375, 0.372711181640625, 0.49639892578125, 0.620086669921875, 0.7437744140625, 0.867462158203125, 0.99114990234375, 1.114837646484375, 1.238525390625, 1.362213134765625, 1.48590087890625, 1.609588623046875, 1.7332763671875, 1.856964111328125, 1.98065185546875, 2.104339599609375, 2.22802734375, 2.351715087890625, 2.47540283203125, 2.599090576171875, 2.7227783203125, 2.846466064453125, 2.97015380859375, 3.093841552734375, 3.217529296875, 3.341217041015625, 3.46490478515625, 3.588592529296875, 3.7122802734375, 3.835968017578125, 3.95965576171875, 4.083343505859375, 4.20703125]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 5.0, 0.0, 2.0, 5.0, 6.0, 7.0, 9.0, 13.0, 15.0, 17.0, 11.0, 31.0, 32.0, 28.0, 50.0, 45.0, 41.0, 47.0, 76.0, 90.0, 204.0, 1675.0, 156.0, 71.0, 61.0, 50.0, 51.0, 38.0, 37.0, 34.0, 31.0, 18.0, 25.0, 20.0, 13.0, 8.0, 4.0, 5.0, 10.0, 7.0, 2.0, 4.0, 1.0, 2.0], "bins": [-30.203125, -29.47216796875, -28.7412109375, -28.01025390625, -27.279296875, -26.54833984375, -25.8173828125, -25.08642578125, -24.35546875, -23.62451171875, -22.8935546875, -22.16259765625, -21.431640625, -20.70068359375, -19.9697265625, -19.23876953125, -18.5078125, -17.77685546875, -17.0458984375, -16.31494140625, -15.583984375, -14.85302734375, -14.1220703125, -13.39111328125, -12.66015625, -11.92919921875, -11.1982421875, -10.46728515625, -9.736328125, -9.00537109375, -8.2744140625, -7.54345703125, -6.8125, -6.08154296875, -5.3505859375, -4.61962890625, -3.888671875, -3.15771484375, -2.4267578125, -1.69580078125, -0.96484375, -0.23388671875, 0.4970703125, 1.22802734375, 1.958984375, 2.68994140625, 3.4208984375, 4.15185546875, 4.8828125, 5.61376953125, 6.3447265625, 7.07568359375, 7.806640625, 8.53759765625, 9.2685546875, 9.99951171875, 10.73046875, 11.46142578125, 12.1923828125, 12.92333984375, 13.654296875, 14.38525390625, 15.1162109375, 15.84716796875, 16.578125]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 6.0, 7.0, 19.0, 23.0, 58.0, 78.0, 166.0, 338.0, 740.0, 40172.0, 3102185.0, 1044.0, 390.0, 197.0, 110.0, 64.0, 38.0, 28.0, 15.0, 11.0, 10.0, 8.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.0, -117.955078125, -113.91015625, -109.865234375, -105.8203125, -101.775390625, -97.73046875, -93.685546875, -89.640625, -85.595703125, -81.55078125, -77.505859375, -73.4609375, -69.416015625, -65.37109375, -61.326171875, -57.28125, -53.236328125, -49.19140625, -45.146484375, -41.1015625, -37.056640625, -33.01171875, -28.966796875, -24.921875, -20.876953125, -16.83203125, -12.787109375, -8.7421875, -4.697265625, -0.65234375, 3.392578125, 7.4375, 11.482421875, 15.52734375, 19.572265625, 23.6171875, 27.662109375, 31.70703125, 35.751953125, 39.796875, 43.841796875, 47.88671875, 51.931640625, 55.9765625, 60.021484375, 64.06640625, 68.111328125, 72.15625, 76.201171875, 80.24609375, 84.291015625, 88.3359375, 92.380859375, 96.42578125, 100.470703125, 104.515625, 108.560546875, 112.60546875, 116.650390625, 120.6953125, 124.740234375, 128.78515625, 132.830078125, 136.875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 114.0, 904.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.190673828125, -26.357084274291992, -14.523494720458984, -2.6899032592773438, 9.143684387207031, 20.977272033691406, 32.81086730957031, 44.64445495605469, 56.47804260253906, 68.31163024902344, 80.14521789550781, 91.97881317138672, 103.8124008178711, 115.64598846435547, 127.47958374023438, 139.31317138671875, 151.14675903320312, 162.9803466796875, 174.81393432617188, 186.64752197265625, 198.48110961914062, 210.314697265625, 222.14830017089844, 233.9818878173828, 245.8154754638672, 257.6490783691406, 269.482666015625, 281.3162536621094, 293.14984130859375, 304.9834289550781, 316.8170166015625, 328.6506042480469, 340.48419189453125, 352.3177795410156, 364.1513671875, 375.9849548339844, 387.81854248046875, 399.6521301269531, 411.4857177734375, 423.3193359375, 435.15289306640625, 446.9864807128906, 458.820068359375, 470.6536560058594, 482.48724365234375, 494.3208312988281, 506.1544189453125, 517.988037109375, 529.8216552734375, 541.6552734375, 553.4888305664062, 565.3224487304688, 577.156005859375, 588.9896240234375, 600.8231811523438, 612.6567993164062, 624.4903564453125, 636.323974609375, 648.1575317382812, 659.9911499023438, 671.82470703125, 683.6583251953125, 695.4918823242188, 707.3255004882812, 719.1590576171875]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 2.0, 5.0, 4.0, 4.0, 4.0, 8.0, 15.0, 11.0, 27.0, 29.0, 25.0, 26.0, 25.0, 30.0, 39.0, 41.0, 42.0, 32.0, 47.0, 34.0, 37.0, 57.0, 44.0, 51.0, 33.0, 41.0, 29.0, 35.0, 30.0, 24.0, 21.0, 25.0, 20.0, 15.0, 17.0, 11.0, 11.0, 9.0, 9.0, 4.0, 3.0, 6.0, 9.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0], "bins": [-70.67227935791016, -68.69947814941406, -66.72667694091797, -64.75387573242188, -62.78107452392578, -60.80827331542969, -58.83546829223633, -56.862667083740234, -54.88986587524414, -52.91706466674805, -50.94426345825195, -48.97146224975586, -46.9986572265625, -45.025856018066406, -43.05305480957031, -41.08025360107422, -39.107452392578125, -37.13465118408203, -35.16184997558594, -33.189048767089844, -31.216245651245117, -29.243444442749023, -27.270641326904297, -25.297840118408203, -23.32503890991211, -21.352237701416016, -19.379436492919922, -17.406633377075195, -15.433832168579102, -13.461030960083008, -11.488228797912598, -9.515426635742188, -7.542625427246094, -5.569823741912842, -3.59702205657959, -1.624220371246338, 0.34858131408691406, 2.321382522583008, 4.294184684753418, 6.266986846923828, 8.239788055419922, 10.212589263916016, 12.185391426086426, 14.158193588256836, 16.13099479675293, 18.103796005249023, 20.07659912109375, 22.049400329589844, 24.022201538085938, 25.99500274658203, 27.967803955078125, 29.94060707092285, 31.913408279418945, 33.886207580566406, 35.859012603759766, 37.83181381225586, 39.80461502075195, 41.77741622924805, 43.75021743774414, 45.723018646240234, 47.695823669433594, 49.66862487792969, 51.64142608642578, 53.614227294921875, 55.58702850341797]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 4.0, 3.0, 1.0, 5.0, 9.0, 4.0, 4.0, 8.0, 9.0, 8.0, 14.0, 10.0, 12.0, 17.0, 20.0, 25.0, 29.0, 31.0, 28.0, 31.0, 28.0, 38.0, 45.0, 36.0, 41.0, 30.0, 46.0, 38.0, 35.0, 41.0, 26.0, 31.0, 42.0, 31.0, 21.0, 22.0, 32.0, 18.0, 22.0, 20.0, 16.0, 15.0, 12.0, 8.0, 9.0, 3.0, 9.0, 8.0, 5.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.94140625, -5.74554443359375, -5.5496826171875, -5.35382080078125, -5.157958984375, -4.96209716796875, -4.7662353515625, -4.57037353515625, -4.37451171875, -4.17864990234375, -3.9827880859375, -3.78692626953125, -3.591064453125, -3.39520263671875, -3.1993408203125, -3.00347900390625, -2.8076171875, -2.61175537109375, -2.4158935546875, -2.22003173828125, -2.024169921875, -1.82830810546875, -1.6324462890625, -1.43658447265625, -1.24072265625, -1.04486083984375, -0.8489990234375, -0.65313720703125, -0.457275390625, -0.26141357421875, -0.0655517578125, 0.13031005859375, 0.326171875, 0.52203369140625, 0.7178955078125, 0.91375732421875, 1.109619140625, 1.30548095703125, 1.5013427734375, 1.69720458984375, 1.89306640625, 2.08892822265625, 2.2847900390625, 2.48065185546875, 2.676513671875, 2.87237548828125, 3.0682373046875, 3.26409912109375, 3.4599609375, 3.65582275390625, 3.8516845703125, 4.04754638671875, 4.243408203125, 4.43927001953125, 4.6351318359375, 4.83099365234375, 5.02685546875, 5.22271728515625, 5.4185791015625, 5.61444091796875, 5.810302734375, 6.00616455078125, 6.2020263671875, 6.39788818359375, 6.59375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 4.0, 7.0, 4.0, 3.0, 10.0, 9.0, 9.0, 21.0, 27.0, 21.0, 38.0, 28.0, 68.0, 84.0, 154.0, 264.0, 596.0, 1979.0, 11649.0, 189300.0, 2414962.0, 1491607.0, 74735.0, 6220.0, 1378.0, 454.0, 206.0, 117.0, 67.0, 45.0, 36.0, 38.0, 19.0, 23.0, 22.0, 15.0, 10.0, 10.0, 9.0, 10.0, 6.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.7265625, -14.1978759765625, -13.669189453125, -13.1405029296875, -12.61181640625, -12.0831298828125, -11.554443359375, -11.0257568359375, -10.4970703125, -9.9683837890625, -9.439697265625, -8.9110107421875, -8.38232421875, -7.8536376953125, -7.324951171875, -6.7962646484375, -6.267578125, -5.7388916015625, -5.210205078125, -4.6815185546875, -4.15283203125, -3.6241455078125, -3.095458984375, -2.5667724609375, -2.0380859375, -1.5093994140625, -0.980712890625, -0.4520263671875, 0.07666015625, 0.6053466796875, 1.134033203125, 1.6627197265625, 2.19140625, 2.7200927734375, 3.248779296875, 3.7774658203125, 4.30615234375, 4.8348388671875, 5.363525390625, 5.8922119140625, 6.4208984375, 6.9495849609375, 7.478271484375, 8.0069580078125, 8.53564453125, 9.0643310546875, 9.593017578125, 10.1217041015625, 10.650390625, 11.1790771484375, 11.707763671875, 12.2364501953125, 12.76513671875, 13.2938232421875, 13.822509765625, 14.3511962890625, 14.8798828125, 15.4085693359375, 15.937255859375, 16.4659423828125, 16.99462890625, 17.5233154296875, 18.052001953125, 18.5806884765625, 19.109375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 5.0, 6.0, 7.0, 9.0, 25.0, 24.0, 31.0, 49.0, 57.0, 109.0, 136.0, 218.0, 297.0, 453.0, 536.0, 548.0, 458.0, 329.0, 244.0, 189.0, 103.0, 85.0, 55.0, 29.0, 19.0, 18.0, 15.0, 11.0, 5.0, 7.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7578125, -12.2884521484375, -11.819091796875, -11.3497314453125, -10.88037109375, -10.4110107421875, -9.941650390625, -9.4722900390625, -9.0029296875, -8.5335693359375, -8.064208984375, -7.5948486328125, -7.12548828125, -6.6561279296875, -6.186767578125, -5.7174072265625, -5.248046875, -4.7786865234375, -4.309326171875, -3.8399658203125, -3.37060546875, -2.9012451171875, -2.431884765625, -1.9625244140625, -1.4931640625, -1.0238037109375, -0.554443359375, -0.0850830078125, 0.38427734375, 0.8536376953125, 1.322998046875, 1.7923583984375, 2.26171875, 2.7310791015625, 3.200439453125, 3.6697998046875, 4.13916015625, 4.6085205078125, 5.077880859375, 5.5472412109375, 6.0166015625, 6.4859619140625, 6.955322265625, 7.4246826171875, 7.89404296875, 8.3634033203125, 8.832763671875, 9.3021240234375, 9.771484375, 10.2408447265625, 10.710205078125, 11.1795654296875, 11.64892578125, 12.1182861328125, 12.587646484375, 13.0570068359375, 13.5263671875, 13.9957275390625, 14.465087890625, 14.9344482421875, 15.40380859375, 15.8731689453125, 16.342529296875, 16.8118896484375, 17.28125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 5.0, 7.0, 12.0, 12.0, 14.0, 14.0, 22.0, 28.0, 24.0, 45.0, 60.0, 65.0, 103.0, 130.0, 184.0, 254.0, 414.0, 751.0, 3234.0, 441959.0, 3725678.0, 18341.0, 1212.0, 517.0, 320.0, 207.0, 171.0, 101.0, 88.0, 68.0, 55.0, 41.0, 48.0, 32.0, 21.0, 16.0, 9.0, 4.0, 6.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-53.71875, -52.19384765625, -50.6689453125, -49.14404296875, -47.619140625, -46.09423828125, -44.5693359375, -43.04443359375, -41.51953125, -39.99462890625, -38.4697265625, -36.94482421875, -35.419921875, -33.89501953125, -32.3701171875, -30.84521484375, -29.3203125, -27.79541015625, -26.2705078125, -24.74560546875, -23.220703125, -21.69580078125, -20.1708984375, -18.64599609375, -17.12109375, -15.59619140625, -14.0712890625, -12.54638671875, -11.021484375, -9.49658203125, -7.9716796875, -6.44677734375, -4.921875, -3.39697265625, -1.8720703125, -0.34716796875, 1.177734375, 2.70263671875, 4.2275390625, 5.75244140625, 7.27734375, 8.80224609375, 10.3271484375, 11.85205078125, 13.376953125, 14.90185546875, 16.4267578125, 17.95166015625, 19.4765625, 21.00146484375, 22.5263671875, 24.05126953125, 25.576171875, 27.10107421875, 28.6259765625, 30.15087890625, 31.67578125, 33.20068359375, 34.7255859375, 36.25048828125, 37.775390625, 39.30029296875, 40.8251953125, 42.35009765625, 43.875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 55.0, 179.0, 347.0, 255.0, 141.0, 24.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-264.9462585449219, -260.19915771484375, -255.4520263671875, -250.7049102783203, -245.95779418945312, -241.21067810058594, -236.46356201171875, -231.71644592285156, -226.96932983398438, -222.2222137451172, -217.47509765625, -212.7279815673828, -207.98086547851562, -203.23374938964844, -198.48663330078125, -193.73951721191406, -188.99240112304688, -184.2452850341797, -179.4981689453125, -174.7510528564453, -170.00393676757812, -165.25682067871094, -160.50970458984375, -155.76258850097656, -151.01547241210938, -146.2683563232422, -141.521240234375, -136.7741241455078, -132.02700805664062, -127.27989196777344, -122.53277587890625, -117.78565979003906, -113.03852844238281, -108.29141235351562, -103.54429626464844, -98.79718017578125, -94.05006408691406, -89.30294799804688, -84.55583190917969, -79.8087158203125, -75.06159973144531, -70.31448364257812, -65.56736755371094, -60.82025146484375, -56.07313537597656, -51.326019287109375, -46.57890319824219, -41.831787109375, -37.08467483520508, -32.33755874633789, -27.590442657470703, -22.843326568603516, -18.096210479736328, -13.34909439086914, -8.601978302001953, -3.8548622131347656, 0.8922538757324219, 5.639369964599609, 10.386486053466797, 15.133602142333984, 19.880718231201172, 24.62783432006836, 29.374950408935547, 34.122066497802734, 38.86918258666992]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 8.0, 6.0, 9.0, 9.0, 9.0, 18.0, 14.0, 21.0, 25.0, 25.0, 30.0, 23.0, 31.0, 43.0, 43.0, 41.0, 35.0, 36.0, 40.0, 44.0, 39.0, 37.0, 42.0, 41.0, 39.0, 37.0, 37.0, 33.0, 27.0, 22.0, 23.0, 22.0, 14.0, 14.0, 7.0, 12.0, 8.0, 6.0, 8.0, 4.0, 4.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-37.302757263183594, -36.025535583496094, -34.748313903808594, -33.47109603881836, -32.19387435913086, -30.91665267944336, -29.63943099975586, -28.362211227416992, -27.084991455078125, -25.807769775390625, -24.530550003051758, -23.253328323364258, -21.97610855102539, -20.69888687133789, -19.42166519165039, -18.144445419311523, -16.867223739624023, -15.59000301361084, -14.312782287597656, -13.035560607910156, -11.758340835571289, -10.481119155883789, -9.203898429870605, -7.926677703857422, -6.649456977844238, -5.372236251831055, -4.095015525817871, -2.8177943229675293, -1.5405735969543457, -0.2633528709411621, 1.0138683319091797, 2.2910890579223633, 3.568309783935547, 4.8455305099487305, 6.122751235961914, 7.399972438812256, 8.677192687988281, 9.954414367675781, 11.231635093688965, 12.508855819702148, 13.786076545715332, 15.063297271728516, 16.340518951416016, 17.617738723754883, 18.894960403442383, 20.17218017578125, 21.44940185546875, 22.72662353515625, 24.003843307495117, 25.281064987182617, 26.558284759521484, 27.835506439208984, 29.11272621154785, 30.38994789123535, 31.66716766357422, 32.94438934326172, 34.22161102294922, 35.49883270263672, 36.77605438232422, 38.05327224731445, 39.33049392700195, 40.60771560668945, 41.88493728637695, 43.16215515136719, 44.43937683105469]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 3.0, 1.0, 2.0, 6.0, 5.0, 9.0, 12.0, 12.0, 9.0, 22.0, 15.0, 21.0, 15.0, 15.0, 15.0, 28.0, 31.0, 26.0, 23.0, 40.0, 45.0, 46.0, 38.0, 38.0, 46.0, 48.0, 43.0, 29.0, 40.0, 36.0, 26.0, 29.0, 32.0, 29.0, 25.0, 19.0, 15.0, 17.0, 19.0, 16.0, 12.0, 8.0, 6.0, 5.0, 10.0, 7.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.1796875, -5.98870849609375, -5.7977294921875, -5.60675048828125, -5.415771484375, -5.22479248046875, -5.0338134765625, -4.84283447265625, -4.65185546875, -4.46087646484375, -4.2698974609375, -4.07891845703125, -3.887939453125, -3.69696044921875, -3.5059814453125, -3.31500244140625, -3.1240234375, -2.93304443359375, -2.7420654296875, -2.55108642578125, -2.360107421875, -2.16912841796875, -1.9781494140625, -1.78717041015625, -1.59619140625, -1.40521240234375, -1.2142333984375, -1.02325439453125, -0.832275390625, -0.64129638671875, -0.4503173828125, -0.25933837890625, -0.068359375, 0.12261962890625, 0.3135986328125, 0.50457763671875, 0.695556640625, 0.88653564453125, 1.0775146484375, 1.26849365234375, 1.45947265625, 1.65045166015625, 1.8414306640625, 2.03240966796875, 2.223388671875, 2.41436767578125, 2.6053466796875, 2.79632568359375, 2.9873046875, 3.17828369140625, 3.3692626953125, 3.56024169921875, 3.751220703125, 3.94219970703125, 4.1331787109375, 4.32415771484375, 4.51513671875, 4.70611572265625, 4.8970947265625, 5.08807373046875, 5.279052734375, 5.47003173828125, 5.6610107421875, 5.85198974609375, 6.04296875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 8.0, 3.0, 14.0, 28.0, 36.0, 33.0, 80.0, 115.0, 144.0, 208.0, 283.0, 407.0, 587.0, 799.0, 1179.0, 1615.0, 2423.0, 3444.0, 5095.0, 7539.0, 11453.0, 17596.0, 26879.0, 42711.0, 68080.0, 110582.0, 169450.0, 191102.0, 141707.0, 89251.0, 54989.0, 34503.0, 22041.0, 14399.0, 9310.0, 6377.0, 4232.0, 2989.0, 2074.0, 1424.0, 975.0, 690.0, 499.0, 378.0, 251.0, 162.0, 120.0, 79.0, 76.0, 36.0, 30.0, 27.0, 14.0, 10.0, 10.0, 8.0, 6.0], "bins": [-0.7177734375, -0.6968307495117188, -0.6758880615234375, -0.6549453735351562, -0.634002685546875, -0.6130599975585938, -0.5921173095703125, -0.5711746215820312, -0.55023193359375, -0.5292892456054688, -0.5083465576171875, -0.48740386962890625, -0.466461181640625, -0.44551849365234375, -0.4245758056640625, -0.40363311767578125, -0.3826904296875, -0.36174774169921875, -0.3408050537109375, -0.31986236572265625, -0.298919677734375, -0.27797698974609375, -0.2570343017578125, -0.23609161376953125, -0.21514892578125, -0.19420623779296875, -0.1732635498046875, -0.15232086181640625, -0.131378173828125, -0.11043548583984375, -0.0894927978515625, -0.06855010986328125, -0.047607421875, -0.02666473388671875, -0.0057220458984375, 0.01522064208984375, 0.036163330078125, 0.05710601806640625, 0.0780487060546875, 0.09899139404296875, 0.11993408203125, 0.14087677001953125, 0.1618194580078125, 0.18276214599609375, 0.203704833984375, 0.22464752197265625, 0.2455902099609375, 0.26653289794921875, 0.2874755859375, 0.30841827392578125, 0.3293609619140625, 0.35030364990234375, 0.371246337890625, 0.39218902587890625, 0.4131317138671875, 0.43407440185546875, 0.45501708984375, 0.47595977783203125, 0.4969024658203125, 0.5178451538085938, 0.538787841796875, 0.5597305297851562, 0.5806732177734375, 0.6016159057617188, 0.62255859375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 0.0, 4.0, 4.0, 4.0, 7.0, 8.0, 13.0, 13.0, 14.0, 19.0, 11.0, 25.0, 20.0, 27.0, 31.0, 29.0, 29.0, 24.0, 32.0, 33.0, 38.0, 49.0, 50.0, 1062.0, 36.0, 48.0, 47.0, 50.0, 41.0, 34.0, 25.0, 23.0, 26.0, 25.0, 17.0, 17.0, 11.0, 17.0, 7.0, 10.0, 10.0, 10.0, 10.0, 3.0, 5.0, 1.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.20703125, -4.08111572265625, -3.9552001953125, -3.82928466796875, -3.703369140625, -3.57745361328125, -3.4515380859375, -3.32562255859375, -3.19970703125, -3.07379150390625, -2.9478759765625, -2.82196044921875, -2.696044921875, -2.57012939453125, -2.4442138671875, -2.31829833984375, -2.1923828125, -2.06646728515625, -1.9405517578125, -1.81463623046875, -1.688720703125, -1.56280517578125, -1.4368896484375, -1.31097412109375, -1.18505859375, -1.05914306640625, -0.9332275390625, -0.80731201171875, -0.681396484375, -0.55548095703125, -0.4295654296875, -0.30364990234375, -0.177734375, -0.05181884765625, 0.0740966796875, 0.20001220703125, 0.325927734375, 0.45184326171875, 0.5777587890625, 0.70367431640625, 0.82958984375, 0.95550537109375, 1.0814208984375, 1.20733642578125, 1.333251953125, 1.45916748046875, 1.5850830078125, 1.71099853515625, 1.8369140625, 1.96282958984375, 2.0887451171875, 2.21466064453125, 2.340576171875, 2.46649169921875, 2.5924072265625, 2.71832275390625, 2.84423828125, 2.97015380859375, 3.0960693359375, 3.22198486328125, 3.347900390625, 3.47381591796875, 3.5997314453125, 3.72564697265625, 3.8515625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 9.0, 6.0, 7.0, 12.0, 19.0, 27.0, 59.0, 75.0, 101.0, 179.0, 275.0, 448.0, 679.0, 1251.0, 2051.0, 3346.0, 5758.0, 9868.0, 17507.0, 31619.0, 59318.0, 112361.0, 196919.0, 1288490.0, 167163.0, 90475.0, 48268.0, 26136.0, 14245.0, 8307.0, 4855.0, 2854.0, 1691.0, 1031.0, 622.0, 418.0, 253.0, 158.0, 97.0, 58.0, 43.0, 28.0, 20.0, 16.0, 11.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0], "bins": [-0.85107421875, -0.8269882202148438, -0.8029022216796875, -0.7788162231445312, -0.754730224609375, -0.7306442260742188, -0.7065582275390625, -0.6824722290039062, -0.65838623046875, -0.6343002319335938, -0.6102142333984375, -0.5861282348632812, -0.562042236328125, -0.5379562377929688, -0.5138702392578125, -0.48978424072265625, -0.4656982421875, -0.44161224365234375, -0.4175262451171875, -0.39344024658203125, -0.369354248046875, -0.34526824951171875, -0.3211822509765625, -0.29709625244140625, -0.27301025390625, -0.24892425537109375, -0.2248382568359375, -0.20075225830078125, -0.176666259765625, -0.15258026123046875, -0.1284942626953125, -0.10440826416015625, -0.080322265625, -0.05623626708984375, -0.0321502685546875, -0.00806427001953125, 0.016021728515625, 0.04010772705078125, 0.0641937255859375, 0.08827972412109375, 0.11236572265625, 0.13645172119140625, 0.1605377197265625, 0.18462371826171875, 0.208709716796875, 0.23279571533203125, 0.2568817138671875, 0.28096771240234375, 0.3050537109375, 0.32913970947265625, 0.3532257080078125, 0.37731170654296875, 0.401397705078125, 0.42548370361328125, 0.4495697021484375, 0.47365570068359375, 0.49774169921875, 0.5218276977539062, 0.5459136962890625, 0.5699996948242188, 0.594085693359375, 0.6181716918945312, 0.6422576904296875, 0.6663436889648438, 0.6904296875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 6.0, 12.0, 10.0, 18.0, 17.0, 14.0, 23.0, 22.0, 29.0, 26.0, 28.0, 48.0, 40.0, 44.0, 40.0, 45.0, 49.0, 62.0, 51.0, 46.0, 56.0, 39.0, 32.0, 39.0, 34.0, 19.0, 31.0, 14.0, 16.0, 17.0, 16.0, 10.0, 3.0, 9.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0019702911376953125, -0.0019125789403915405, -0.0018548667430877686, -0.0017971545457839966, -0.0017394423484802246, -0.0016817301511764526, -0.0016240179538726807, -0.0015663057565689087, -0.0015085935592651367, -0.0014508813619613647, -0.0013931691646575928, -0.0013354569673538208, -0.0012777447700500488, -0.0012200325727462769, -0.0011623203754425049, -0.001104608178138733, -0.001046895980834961, -0.000989183783531189, -0.000931471586227417, -0.000873759388923645, -0.000816047191619873, -0.0007583349943161011, -0.0007006227970123291, -0.0006429105997085571, -0.0005851984024047852, -0.0005274862051010132, -0.0004697740077972412, -0.00041206181049346924, -0.00035434961318969727, -0.0002966374158859253, -0.00023892521858215332, -0.00018121302127838135, -0.00012350082397460938, -6.57886266708374e-05, -8.07642936706543e-06, 4.963576793670654e-05, 0.00010734796524047852, 0.0001650601625442505, 0.00022277235984802246, 0.00028048455715179443, 0.0003381967544555664, 0.0003959089517593384, 0.00045362114906311035, 0.0005113333463668823, 0.0005690455436706543, 0.0006267577409744263, 0.0006844699382781982, 0.0007421821355819702, 0.0007998943328857422, 0.0008576065301895142, 0.0009153187274932861, 0.0009730309247970581, 0.00103074312210083, 0.001088455319404602, 0.001146167516708374, 0.001203879714012146, 0.001261591911315918, 0.00131930410861969, 0.001377016305923462, 0.0014347285032272339, 0.0014924407005310059, 0.0015501528978347778, 0.0016078650951385498, 0.0016655772924423218, 0.0017232894897460938]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 6.0, 11.0, 7.0, 10.0, 8.0, 26.0, 22.0, 29.0, 21.0, 48.0, 53.0, 58.0, 89.0, 143.0, 276.0, 763.0, 4292.0, 1035334.0, 5667.0, 794.0, 288.0, 148.0, 102.0, 78.0, 49.0, 46.0, 34.0, 30.0, 14.0, 24.0, 13.0, 17.0, 8.0, 13.0, 9.0, 2.0, 5.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04180908203125, -0.040439605712890625, -0.03907012939453125, -0.037700653076171875, -0.0363311767578125, -0.034961700439453125, -0.03359222412109375, -0.032222747802734375, -0.030853271484375, -0.029483795166015625, -0.02811431884765625, -0.026744842529296875, -0.0253753662109375, -0.024005889892578125, -0.02263641357421875, -0.021266937255859375, -0.0198974609375, -0.018527984619140625, -0.01715850830078125, -0.015789031982421875, -0.0144195556640625, -0.013050079345703125, -0.01168060302734375, -0.010311126708984375, -0.008941650390625, -0.007572174072265625, -0.00620269775390625, -0.004833221435546875, -0.0034637451171875, -0.002094268798828125, -0.00072479248046875, 0.000644683837890625, 0.00201416015625, 0.003383636474609375, 0.00475311279296875, 0.006122589111328125, 0.0074920654296875, 0.008861541748046875, 0.01023101806640625, 0.011600494384765625, 0.012969970703125, 0.014339447021484375, 0.01570892333984375, 0.017078399658203125, 0.0184478759765625, 0.019817352294921875, 0.02118682861328125, 0.022556304931640625, 0.02392578125, 0.025295257568359375, 0.02666473388671875, 0.028034210205078125, 0.0294036865234375, 0.030773162841796875, 0.03214263916015625, 0.033512115478515625, 0.034881591796875, 0.036251068115234375, 0.03762054443359375, 0.038990020751953125, 0.0403594970703125, 0.041728973388671875, 0.04309844970703125, 0.044467926025390625, 0.04583740234375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 398.0, 616.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02293269895017147, -0.022516237571835518, -0.022099776193499565, -0.021683314815163612, -0.02126685343682766, -0.020850392058491707, -0.020433930680155754, -0.0200174693018198, -0.01960100792348385, -0.019184546545147896, -0.018768085166811943, -0.01835162378847599, -0.017935162410140038, -0.017518701031804085, -0.017102239653468132, -0.01668577827513218, -0.016269316896796227, -0.015852855518460274, -0.015436394140124321, -0.015019932761788368, -0.014603471383452415, -0.014187010005116463, -0.01377054862678051, -0.013354087248444557, -0.012937626801431179, -0.012521165423095226, -0.012104704044759274, -0.01168824266642332, -0.011271781288087368, -0.010855319909751415, -0.010438858531415462, -0.01002239715307951, -0.009605935774743557, -0.009189474396407604, -0.008773013018071651, -0.008356551639735699, -0.007940090261399746, -0.007523628883063793, -0.00710716750472784, -0.006690706126391888, -0.006274244748055935, -0.005857783369719982, -0.005441321991384029, -0.005024860613048077, -0.004608399234712124, -0.004191937856376171, -0.003775476710870862, -0.0033590153325349092, -0.0029425539541989565, -0.0025260925758630037, -0.002109631197527051, -0.00169316993560642, -0.0012767085572704673, -0.0008602472953498363, -0.0004437859170138836, -2.7324538677930832e-05, 0.0003891368396580219, 0.0008055982179939747, 0.0012220595963299274, 0.0016385208582505584, 0.002054982353001833, 0.002471443498507142, 0.002887904876843095, 0.0033043662551790476, 0.0037208276335150003]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 8.0, 7.0, 10.0, 11.0, 10.0, 11.0, 21.0, 12.0, 24.0, 25.0, 32.0, 34.0, 46.0, 33.0, 35.0, 40.0, 48.0, 43.0, 54.0, 44.0, 44.0, 41.0, 42.0, 43.0, 32.0, 49.0, 32.0, 30.0, 30.0, 34.0, 18.0, 17.0, 9.0, 10.0, 5.0, 5.0, 3.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011264681816101074, -0.0010897452011704445, -0.0010530222207307816, -0.0010162992402911186, -0.0009795762598514557, -0.0009428532794117928, -0.0009061302989721298, -0.0008694073185324669, -0.000832684338092804, -0.000795961357653141, -0.0007592383772134781, -0.0007225153967738152, -0.0006857924163341522, -0.0006490694358944893, -0.0006123464554548264, -0.0005756234750151634, -0.0005389004945755005, -0.0005021775141358376, -0.0004654545336961746, -0.0004287315532565117, -0.00039200857281684875, -0.0003552855923771858, -0.0003185626119375229, -0.00028183963149785995, -0.000245116651058197, -0.0002083936706185341, -0.00017167069017887115, -0.00013494770973920822, -9.822472929954529e-05, -6.150174885988235e-05, -2.477876842021942e-05, 1.1944212019443512e-05, 4.8667192459106445e-05, 8.539017289876938e-05, 0.0001221131533384323, 0.00015883613377809525, 0.00019555911421775818, 0.0002322820946574211, 0.00026900507509708405, 0.000305728055536747, 0.0003424510359764099, 0.00037917401641607285, 0.0004158969968557358, 0.0004526199772953987, 0.0004893429577350616, 0.0005260659381747246, 0.0005627889186143875, 0.0005995118990540504, 0.0006362348794937134, 0.0006729578599333763, 0.0007096808403730392, 0.0007464038208127022, 0.0007831268012523651, 0.000819849781692028, 0.000856572762131691, 0.0008932957425713539, 0.0009300187230110168, 0.0009667417034506798, 0.0010034646838903427, 0.0010401876643300056, 0.0010769106447696686, 0.0011136336252093315, 0.0011503566056489944, 0.0011870795860886574, 0.0012238025665283203]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 3.0, 1.0, 2.0, 6.0, 5.0, 9.0, 12.0, 12.0, 9.0, 22.0, 15.0, 21.0, 15.0, 15.0, 15.0, 28.0, 31.0, 26.0, 23.0, 40.0, 45.0, 46.0, 38.0, 38.0, 46.0, 48.0, 43.0, 29.0, 40.0, 36.0, 26.0, 29.0, 32.0, 29.0, 25.0, 19.0, 15.0, 17.0, 19.0, 16.0, 12.0, 8.0, 6.0, 5.0, 10.0, 7.0, 8.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.1796875, -5.98870849609375, -5.7977294921875, -5.60675048828125, -5.415771484375, -5.22479248046875, -5.0338134765625, -4.84283447265625, -4.65185546875, -4.46087646484375, -4.2698974609375, -4.07891845703125, -3.887939453125, -3.69696044921875, -3.5059814453125, -3.31500244140625, -3.1240234375, -2.93304443359375, -2.7420654296875, -2.55108642578125, -2.360107421875, -2.16912841796875, -1.9781494140625, -1.78717041015625, -1.59619140625, -1.40521240234375, -1.2142333984375, -1.02325439453125, -0.832275390625, -0.64129638671875, -0.4503173828125, -0.25933837890625, -0.068359375, 0.12261962890625, 0.3135986328125, 0.50457763671875, 0.695556640625, 0.88653564453125, 1.0775146484375, 1.26849365234375, 1.45947265625, 1.65045166015625, 1.8414306640625, 2.03240966796875, 2.223388671875, 2.41436767578125, 2.6053466796875, 2.79632568359375, 2.9873046875, 3.17828369140625, 3.3692626953125, 3.56024169921875, 3.751220703125, 3.94219970703125, 4.1331787109375, 4.32415771484375, 4.51513671875, 4.70611572265625, 4.8970947265625, 5.08807373046875, 5.279052734375, 5.47003173828125, 5.6610107421875, 5.85198974609375, 6.04296875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 3.0, 1.0, 3.0, 6.0, 6.0, 11.0, 15.0, 22.0, 19.0, 31.0, 35.0, 50.0, 69.0, 95.0, 168.0, 239.0, 419.0, 710.0, 1315.0, 2706.0, 5860.0, 14826.0, 48680.0, 223311.0, 552911.0, 142764.0, 33679.0, 11037.0, 4647.0, 2140.0, 1094.0, 583.0, 361.0, 231.0, 154.0, 96.0, 62.0, 51.0, 42.0, 28.0, 17.0, 14.0, 8.0, 8.0, 12.0, 7.0, 9.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.98046875, -5.795654296875, -5.61083984375, -5.426025390625, -5.2412109375, -5.056396484375, -4.87158203125, -4.686767578125, -4.501953125, -4.317138671875, -4.13232421875, -3.947509765625, -3.7626953125, -3.577880859375, -3.39306640625, -3.208251953125, -3.0234375, -2.838623046875, -2.65380859375, -2.468994140625, -2.2841796875, -2.099365234375, -1.91455078125, -1.729736328125, -1.544921875, -1.360107421875, -1.17529296875, -0.990478515625, -0.8056640625, -0.620849609375, -0.43603515625, -0.251220703125, -0.06640625, 0.118408203125, 0.30322265625, 0.488037109375, 0.6728515625, 0.857666015625, 1.04248046875, 1.227294921875, 1.412109375, 1.596923828125, 1.78173828125, 1.966552734375, 2.1513671875, 2.336181640625, 2.52099609375, 2.705810546875, 2.890625, 3.075439453125, 3.26025390625, 3.445068359375, 3.6298828125, 3.814697265625, 3.99951171875, 4.184326171875, 4.369140625, 4.553955078125, 4.73876953125, 4.923583984375, 5.1083984375, 5.293212890625, 5.47802734375, 5.662841796875, 5.84765625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 5.0, 7.0, 5.0, 7.0, 7.0, 5.0, 12.0, 13.0, 22.0, 32.0, 19.0, 24.0, 30.0, 34.0, 43.0, 30.0, 46.0, 30.0, 43.0, 76.0, 281.0, 1651.0, 157.0, 69.0, 35.0, 30.0, 44.0, 36.0, 36.0, 30.0, 27.0, 19.0, 27.0, 20.0, 16.0, 22.0, 4.0, 11.0, 8.0, 3.0, 8.0, 7.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-19.125, -18.513427734375, -17.90185546875, -17.290283203125, -16.6787109375, -16.067138671875, -15.45556640625, -14.843994140625, -14.232421875, -13.620849609375, -13.00927734375, -12.397705078125, -11.7861328125, -11.174560546875, -10.56298828125, -9.951416015625, -9.33984375, -8.728271484375, -8.11669921875, -7.505126953125, -6.8935546875, -6.281982421875, -5.67041015625, -5.058837890625, -4.447265625, -3.835693359375, -3.22412109375, -2.612548828125, -2.0009765625, -1.389404296875, -0.77783203125, -0.166259765625, 0.4453125, 1.056884765625, 1.66845703125, 2.280029296875, 2.8916015625, 3.503173828125, 4.11474609375, 4.726318359375, 5.337890625, 5.949462890625, 6.56103515625, 7.172607421875, 7.7841796875, 8.395751953125, 9.00732421875, 9.618896484375, 10.23046875, 10.842041015625, 11.45361328125, 12.065185546875, 12.6767578125, 13.288330078125, 13.89990234375, 14.511474609375, 15.123046875, 15.734619140625, 16.34619140625, 16.957763671875, 17.5693359375, 18.180908203125, 18.79248046875, 19.404052734375, 20.015625]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 5.0, 8.0, 12.0, 11.0, 15.0, 17.0, 25.0, 35.0, 51.0, 76.0, 98.0, 158.0, 247.0, 352.0, 857.0, 7403.0, 3121454.0, 12710.0, 984.0, 423.0, 226.0, 164.0, 102.0, 69.0, 58.0, 47.0, 26.0, 15.0, 12.0, 11.0, 11.0, 7.0, 6.0, 5.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-66.25, -64.3330078125, -62.416015625, -60.4990234375, -58.58203125, -56.6650390625, -54.748046875, -52.8310546875, -50.9140625, -48.9970703125, -47.080078125, -45.1630859375, -43.24609375, -41.3291015625, -39.412109375, -37.4951171875, -35.578125, -33.6611328125, -31.744140625, -29.8271484375, -27.91015625, -25.9931640625, -24.076171875, -22.1591796875, -20.2421875, -18.3251953125, -16.408203125, -14.4912109375, -12.57421875, -10.6572265625, -8.740234375, -6.8232421875, -4.90625, -2.9892578125, -1.072265625, 0.8447265625, 2.76171875, 4.6787109375, 6.595703125, 8.5126953125, 10.4296875, 12.3466796875, 14.263671875, 16.1806640625, 18.09765625, 20.0146484375, 21.931640625, 23.8486328125, 25.765625, 27.6826171875, 29.599609375, 31.5166015625, 33.43359375, 35.3505859375, 37.267578125, 39.1845703125, 41.1015625, 43.0185546875, 44.935546875, 46.8525390625, 48.76953125, 50.6865234375, 52.603515625, 54.5205078125, 56.4375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 44.0, 236.0, 472.0, 223.0, 37.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-89.24227905273438, -87.19169616699219, -85.14111328125, -83.09052276611328, -81.0399398803711, -78.9893569946289, -76.93877410888672, -74.88819122314453, -72.83760070800781, -70.78701782226562, -68.73643493652344, -66.68584442138672, -64.63526153564453, -62.584678649902344, -60.534095764160156, -58.48351287841797, -56.43292999267578, -54.382347106933594, -52.33176040649414, -50.28117752075195, -48.2305908203125, -46.18000793457031, -44.129425048828125, -42.07884216308594, -40.028255462646484, -37.9776725769043, -35.927085876464844, -33.876502990722656, -31.825918197631836, -29.775333404541016, -27.724750518798828, -25.674165725708008, -23.623584747314453, -21.572999954223633, -19.522415161132812, -17.471832275390625, -15.421247482299805, -13.370662689208984, -11.32007884979248, -9.269495010375977, -7.218910217285156, -5.168325901031494, -3.117741584777832, -1.06715726852417, 0.9834270477294922, 3.0340118408203125, 5.084595680236816, 7.13517951965332, 9.18576431274414, 11.236349105834961, 13.286932945251465, 15.337516784667969, 17.38810157775879, 19.43868637084961, 21.489269256591797, 23.539854049682617, 25.590438842773438, 27.641023635864258, 29.691608428955078, 31.742191314697266, 33.79277801513672, 35.843360900878906, 37.893943786621094, 39.94452667236328, 41.995113372802734]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 8.0, 5.0, 7.0, 6.0, 13.0, 9.0, 8.0, 10.0, 19.0, 27.0, 29.0, 14.0, 23.0, 18.0, 36.0, 40.0, 46.0, 53.0, 48.0, 48.0, 48.0, 40.0, 55.0, 39.0, 54.0, 28.0, 28.0, 34.0, 25.0, 24.0, 24.0, 34.0, 19.0, 15.0, 15.0, 11.0, 11.0, 8.0, 5.0, 6.0, 4.0, 3.0, 1.0, 7.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.29931640625, -58.53845977783203, -56.77760696411133, -55.01675033569336, -53.25589370727539, -51.49504089355469, -49.73418426513672, -47.97332763671875, -46.21247100830078, -44.45161437988281, -42.69076156616211, -40.92990493774414, -39.16904830932617, -37.40819549560547, -35.6473388671875, -33.88648223876953, -32.12562561035156, -30.364770889282227, -28.603914260864258, -26.843059539794922, -25.082202911376953, -23.321348190307617, -21.56049346923828, -19.799636840820312, -18.03878402709961, -16.277929306030273, -14.517072677612305, -12.756217956542969, -10.995361328125, -9.234506607055664, -7.473650932312012, -5.712795257568359, -3.9519386291503906, -2.1910829544067383, -0.43022751808166504, 1.3306279182434082, 3.0914835929870605, 4.852338790893555, 6.613194465637207, 8.37405014038086, 10.134905815124512, 11.895761489868164, 13.656617164611816, 15.417472839355469, 17.178327560424805, 18.93918228149414, 20.70003890991211, 22.460895538330078, 24.221750259399414, 25.98260498046875, 27.74346160888672, 29.504316329956055, 31.265172958374023, 33.02602767944336, 34.78688430786133, 36.54773712158203, 38.30859375, 40.06945037841797, 41.83030319213867, 43.59115982055664, 45.35201644897461, 47.11286926269531, 48.87372589111328, 50.63458251953125, 52.39543914794922]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 4.0, 5.0, 7.0, 8.0, 13.0, 20.0, 14.0, 14.0, 11.0, 19.0, 20.0, 16.0, 19.0, 32.0, 21.0, 35.0, 39.0, 48.0, 38.0, 50.0, 29.0, 44.0, 48.0, 43.0, 44.0, 35.0, 30.0, 30.0, 21.0, 43.0, 30.0, 25.0, 22.0, 20.0, 16.0, 16.0, 16.0, 13.0, 7.0, 5.0, 7.0, 10.0, 6.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.3828125, -6.1806640625, -5.978515625, -5.7763671875, -5.57421875, -5.3720703125, -5.169921875, -4.9677734375, -4.765625, -4.5634765625, -4.361328125, -4.1591796875, -3.95703125, -3.7548828125, -3.552734375, -3.3505859375, -3.1484375, -2.9462890625, -2.744140625, -2.5419921875, -2.33984375, -2.1376953125, -1.935546875, -1.7333984375, -1.53125, -1.3291015625, -1.126953125, -0.9248046875, -0.72265625, -0.5205078125, -0.318359375, -0.1162109375, 0.0859375, 0.2880859375, 0.490234375, 0.6923828125, 0.89453125, 1.0966796875, 1.298828125, 1.5009765625, 1.703125, 1.9052734375, 2.107421875, 2.3095703125, 2.51171875, 2.7138671875, 2.916015625, 3.1181640625, 3.3203125, 3.5224609375, 3.724609375, 3.9267578125, 4.12890625, 4.3310546875, 4.533203125, 4.7353515625, 4.9375, 5.1396484375, 5.341796875, 5.5439453125, 5.74609375, 5.9482421875, 6.150390625, 6.3525390625, 6.5546875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 5.0, 3.0, 3.0, 4.0, 5.0, 5.0, 10.0, 10.0, 19.0, 22.0, 23.0, 25.0, 42.0, 31.0, 36.0, 55.0, 50.0, 65.0, 111.0, 194.0, 290.0, 526.0, 1417.0, 5976.0, 56114.0, 1045215.0, 2685961.0, 371572.0, 20894.0, 3316.0, 1020.0, 401.0, 205.0, 154.0, 101.0, 82.0, 58.0, 45.0, 33.0, 37.0, 27.0, 28.0, 29.0, 19.0, 10.0, 12.0, 7.0, 8.0, 2.0, 6.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.8984375, -15.4063720703125, -14.914306640625, -14.4222412109375, -13.93017578125, -13.4381103515625, -12.946044921875, -12.4539794921875, -11.9619140625, -11.4698486328125, -10.977783203125, -10.4857177734375, -9.99365234375, -9.5015869140625, -9.009521484375, -8.5174560546875, -8.025390625, -7.5333251953125, -7.041259765625, -6.5491943359375, -6.05712890625, -5.5650634765625, -5.072998046875, -4.5809326171875, -4.0888671875, -3.5968017578125, -3.104736328125, -2.6126708984375, -2.12060546875, -1.6285400390625, -1.136474609375, -0.6444091796875, -0.15234375, 0.3397216796875, 0.831787109375, 1.3238525390625, 1.81591796875, 2.3079833984375, 2.800048828125, 3.2921142578125, 3.7841796875, 4.2762451171875, 4.768310546875, 5.2603759765625, 5.75244140625, 6.2445068359375, 6.736572265625, 7.2286376953125, 7.720703125, 8.2127685546875, 8.704833984375, 9.1968994140625, 9.68896484375, 10.1810302734375, 10.673095703125, 11.1651611328125, 11.6572265625, 12.1492919921875, 12.641357421875, 13.1334228515625, 13.62548828125, 14.1175537109375, 14.609619140625, 15.1016845703125, 15.59375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 8.0, 10.0, 12.0, 12.0, 17.0, 40.0, 51.0, 58.0, 107.0, 172.0, 244.0, 343.0, 440.0, 550.0, 565.0, 466.0, 322.0, 216.0, 152.0, 104.0, 59.0, 38.0, 26.0, 16.0, 18.0, 11.0, 9.0, 7.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.140625, -17.662353515625, -17.18408203125, -16.705810546875, -16.2275390625, -15.749267578125, -15.27099609375, -14.792724609375, -14.314453125, -13.836181640625, -13.35791015625, -12.879638671875, -12.4013671875, -11.923095703125, -11.44482421875, -10.966552734375, -10.48828125, -10.010009765625, -9.53173828125, -9.053466796875, -8.5751953125, -8.096923828125, -7.61865234375, -7.140380859375, -6.662109375, -6.183837890625, -5.70556640625, -5.227294921875, -4.7490234375, -4.270751953125, -3.79248046875, -3.314208984375, -2.8359375, -2.357666015625, -1.87939453125, -1.401123046875, -0.9228515625, -0.444580078125, 0.03369140625, 0.511962890625, 0.990234375, 1.468505859375, 1.94677734375, 2.425048828125, 2.9033203125, 3.381591796875, 3.85986328125, 4.338134765625, 4.81640625, 5.294677734375, 5.77294921875, 6.251220703125, 6.7294921875, 7.207763671875, 7.68603515625, 8.164306640625, 8.642578125, 9.120849609375, 9.59912109375, 10.077392578125, 10.5556640625, 11.033935546875, 11.51220703125, 11.990478515625, 12.46875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 1.0, 6.0, 10.0, 16.0, 18.0, 35.0, 23.0, 36.0, 59.0, 93.0, 113.0, 147.0, 217.0, 326.0, 493.0, 1246.0, 46623.0, 4114192.0, 28025.0, 1024.0, 476.0, 291.0, 224.0, 175.0, 117.0, 69.0, 73.0, 51.0, 30.0, 23.0, 18.0, 15.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.90625, -53.94189453125, -51.9775390625, -50.01318359375, -48.048828125, -46.08447265625, -44.1201171875, -42.15576171875, -40.19140625, -38.22705078125, -36.2626953125, -34.29833984375, -32.333984375, -30.36962890625, -28.4052734375, -26.44091796875, -24.4765625, -22.51220703125, -20.5478515625, -18.58349609375, -16.619140625, -14.65478515625, -12.6904296875, -10.72607421875, -8.76171875, -6.79736328125, -4.8330078125, -2.86865234375, -0.904296875, 1.06005859375, 3.0244140625, 4.98876953125, 6.953125, 8.91748046875, 10.8818359375, 12.84619140625, 14.810546875, 16.77490234375, 18.7392578125, 20.70361328125, 22.66796875, 24.63232421875, 26.5966796875, 28.56103515625, 30.525390625, 32.48974609375, 34.4541015625, 36.41845703125, 38.3828125, 40.34716796875, 42.3115234375, 44.27587890625, 46.240234375, 48.20458984375, 50.1689453125, 52.13330078125, 54.09765625, 56.06201171875, 58.0263671875, 59.99072265625, 61.955078125, 63.91943359375, 65.8837890625, 67.84814453125, 69.8125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 31.0, 150.0, 360.0, 314.0, 134.0, 19.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-193.0688934326172, -187.9818572998047, -182.89483642578125, -177.80780029296875, -172.72076416015625, -167.63372802734375, -162.5467071533203, -157.4596710205078, -152.37265014648438, -147.28561401367188, -142.19859313964844, -137.11155700683594, -132.02452087402344, -126.93749237060547, -121.8504638671875, -116.763427734375, -111.6763916015625, -106.58936309814453, -101.50232696533203, -96.41529846191406, -91.32826232910156, -86.2412338256836, -81.15420532226562, -76.06716918945312, -70.98014068603516, -65.89311218261719, -60.80607604980469, -55.71904754638672, -50.632015228271484, -45.54498291015625, -40.45795440673828, -35.37092208862305, -30.28387451171875, -25.196842193603516, -20.109811782836914, -15.022780418395996, -9.935749053955078, -4.848716735839844, 0.2383136749267578, 5.325344085693359, 10.412376403808594, 15.499407768249512, 20.58643913269043, 25.67346954345703, 30.760501861572266, 35.8475341796875, 40.93456268310547, 46.0215950012207, 51.10862731933594, 56.19565963745117, 61.282691955566406, 66.36972045898438, 71.45675659179688, 76.54378509521484, 81.63081359863281, 86.71784973144531, 91.80487823486328, 96.89190673828125, 101.97894287109375, 107.06597137451172, 112.15299987792969, 117.24003601074219, 122.32706451416016, 127.41409301757812, 132.50112915039062]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 9.0, 6.0, 4.0, 9.0, 8.0, 10.0, 15.0, 12.0, 13.0, 14.0, 14.0, 17.0, 15.0, 26.0, 24.0, 21.0, 29.0, 31.0, 34.0, 43.0, 33.0, 32.0, 32.0, 33.0, 32.0, 35.0, 48.0, 37.0, 33.0, 39.0, 22.0, 26.0, 27.0, 22.0, 21.0, 24.0, 19.0, 24.0, 16.0, 11.0, 15.0, 12.0, 12.0, 20.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-34.1666259765625, -33.10106658935547, -32.03550338745117, -30.96994400024414, -29.90438461303711, -28.838823318481445, -27.77326202392578, -26.70770263671875, -25.642141342163086, -24.576580047607422, -23.51102066040039, -22.445459365844727, -21.379898071289062, -20.31433868408203, -19.248777389526367, -18.183216094970703, -17.117656707763672, -16.052095413208008, -14.986536026000977, -13.920974731445312, -12.855414390563965, -11.789854049682617, -10.724292755126953, -9.658732414245605, -8.593172073364258, -7.52761173248291, -6.462050914764404, -5.396490097045898, -4.330929756164551, -3.265369415283203, -2.1998085975646973, -1.1342477798461914, -0.06868743896484375, 0.996873140335083, 2.0624337196350098, 3.1279942989349365, 4.193554878234863, 5.259115219116211, 6.324676036834717, 7.390236854553223, 8.45579719543457, 9.521357536315918, 10.586917877197266, 11.65247917175293, 12.718039512634277, 13.783599853515625, 14.849161148071289, 15.914721488952637, 16.980281829833984, 18.04584312438965, 19.11140251159668, 20.176963806152344, 21.242523193359375, 22.30808448791504, 23.373645782470703, 24.439205169677734, 25.5047664642334, 26.570327758789062, 27.635887145996094, 28.701448440551758, 29.767009735107422, 30.832569122314453, 31.898130416870117, 32.96369171142578, 34.02925109863281]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 3.0, 6.0, 9.0, 12.0, 10.0, 10.0, 13.0, 10.0, 10.0, 17.0, 23.0, 26.0, 25.0, 20.0, 26.0, 19.0, 32.0, 29.0, 43.0, 45.0, 37.0, 47.0, 40.0, 32.0, 41.0, 34.0, 36.0, 28.0, 31.0, 47.0, 30.0, 24.0, 24.0, 15.0, 22.0, 21.0, 15.0, 13.0, 12.0, 16.0, 13.0, 6.0, 7.0, 8.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.234375, -6.04779052734375, -5.8612060546875, -5.67462158203125, -5.488037109375, -5.30145263671875, -5.1148681640625, -4.92828369140625, -4.74169921875, -4.55511474609375, -4.3685302734375, -4.18194580078125, -3.995361328125, -3.80877685546875, -3.6221923828125, -3.43560791015625, -3.2490234375, -3.06243896484375, -2.8758544921875, -2.68927001953125, -2.502685546875, -2.31610107421875, -2.1295166015625, -1.94293212890625, -1.75634765625, -1.56976318359375, -1.3831787109375, -1.19659423828125, -1.010009765625, -0.82342529296875, -0.6368408203125, -0.45025634765625, -0.263671875, -0.07708740234375, 0.1094970703125, 0.29608154296875, 0.482666015625, 0.66925048828125, 0.8558349609375, 1.04241943359375, 1.22900390625, 1.41558837890625, 1.6021728515625, 1.78875732421875, 1.975341796875, 2.16192626953125, 2.3485107421875, 2.53509521484375, 2.7216796875, 2.90826416015625, 3.0948486328125, 3.28143310546875, 3.468017578125, 3.65460205078125, 3.8411865234375, 4.02777099609375, 4.21435546875, 4.40093994140625, 4.5875244140625, 4.77410888671875, 4.960693359375, 5.14727783203125, 5.3338623046875, 5.52044677734375, 5.70703125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 6.0, 10.0, 19.0, 29.0, 33.0, 47.0, 58.0, 100.0, 162.0, 231.0, 327.0, 464.0, 641.0, 999.0, 1398.0, 2012.0, 2803.0, 4063.0, 5592.0, 8021.0, 12067.0, 17894.0, 26582.0, 41297.0, 65794.0, 106414.0, 160777.0, 185894.0, 144893.0, 92356.0, 57069.0, 35995.0, 23610.0, 15923.0, 10573.0, 7336.0, 5132.0, 3569.0, 2539.0, 1757.0, 1267.0, 849.0, 608.0, 417.0, 329.0, 191.0, 115.0, 95.0, 83.0, 37.0, 30.0, 21.0, 10.0, 7.0, 5.0, 7.0, 6.0, 1.0, 3.0, 2.0], "bins": [-0.6015625, -0.5823745727539062, -0.5631866455078125, -0.5439987182617188, -0.524810791015625, -0.5056228637695312, -0.4864349365234375, -0.46724700927734375, -0.44805908203125, -0.42887115478515625, -0.4096832275390625, -0.39049530029296875, -0.371307373046875, -0.35211944580078125, -0.3329315185546875, -0.31374359130859375, -0.2945556640625, -0.27536773681640625, -0.2561798095703125, -0.23699188232421875, -0.217803955078125, -0.19861602783203125, -0.1794281005859375, -0.16024017333984375, -0.14105224609375, -0.12186431884765625, -0.1026763916015625, -0.08348846435546875, -0.064300537109375, -0.04511260986328125, -0.0259246826171875, -0.00673675537109375, 0.012451171875, 0.03163909912109375, 0.0508270263671875, 0.07001495361328125, 0.089202880859375, 0.10839080810546875, 0.1275787353515625, 0.14676666259765625, 0.16595458984375, 0.18514251708984375, 0.2043304443359375, 0.22351837158203125, 0.242706298828125, 0.26189422607421875, 0.2810821533203125, 0.30027008056640625, 0.3194580078125, 0.33864593505859375, 0.3578338623046875, 0.37702178955078125, 0.396209716796875, 0.41539764404296875, 0.4345855712890625, 0.45377349853515625, 0.47296142578125, 0.49214935302734375, 0.5113372802734375, 0.5305252075195312, 0.549713134765625, 0.5689010620117188, 0.5880889892578125, 0.6072769165039062, 0.62646484375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 6.0, 4.0, 15.0, 21.0, 16.0, 18.0, 20.0, 12.0, 24.0, 23.0, 32.0, 26.0, 37.0, 42.0, 27.0, 42.0, 44.0, 46.0, 1070.0, 42.0, 35.0, 35.0, 34.0, 41.0, 43.0, 40.0, 32.0, 25.0, 19.0, 18.0, 19.0, 21.0, 18.0, 10.0, 11.0, 9.0, 8.0, 7.0, 3.0, 3.0, 10.0, 6.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7890625, -3.661376953125, -3.53369140625, -3.406005859375, -3.2783203125, -3.150634765625, -3.02294921875, -2.895263671875, -2.767578125, -2.639892578125, -2.51220703125, -2.384521484375, -2.2568359375, -2.129150390625, -2.00146484375, -1.873779296875, -1.74609375, -1.618408203125, -1.49072265625, -1.363037109375, -1.2353515625, -1.107666015625, -0.97998046875, -0.852294921875, -0.724609375, -0.596923828125, -0.46923828125, -0.341552734375, -0.2138671875, -0.086181640625, 0.04150390625, 0.169189453125, 0.296875, 0.424560546875, 0.55224609375, 0.679931640625, 0.8076171875, 0.935302734375, 1.06298828125, 1.190673828125, 1.318359375, 1.446044921875, 1.57373046875, 1.701416015625, 1.8291015625, 1.956787109375, 2.08447265625, 2.212158203125, 2.33984375, 2.467529296875, 2.59521484375, 2.722900390625, 2.8505859375, 2.978271484375, 3.10595703125, 3.233642578125, 3.361328125, 3.489013671875, 3.61669921875, 3.744384765625, 3.8720703125, 3.999755859375, 4.12744140625, 4.255126953125, 4.3828125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 4.0, 5.0, 10.0, 8.0, 16.0, 21.0, 31.0, 51.0, 67.0, 82.0, 156.0, 216.0, 297.0, 479.0, 719.0, 1110.0, 1696.0, 2669.0, 4189.0, 6622.0, 10483.0, 17187.0, 28040.0, 46916.0, 79576.0, 135187.0, 1228267.0, 214778.0, 128061.0, 75599.0, 44223.0, 26500.0, 16014.0, 10028.0, 6324.0, 4061.0, 2581.0, 1702.0, 1140.0, 702.0, 438.0, 288.0, 207.0, 142.0, 84.0, 42.0, 28.0, 27.0, 26.0, 12.0, 9.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.626953125, -0.60601806640625, -0.5850830078125, -0.56414794921875, -0.543212890625, -0.52227783203125, -0.5013427734375, -0.48040771484375, -0.45947265625, -0.43853759765625, -0.4176025390625, -0.39666748046875, -0.375732421875, -0.35479736328125, -0.3338623046875, -0.31292724609375, -0.2919921875, -0.27105712890625, -0.2501220703125, -0.22918701171875, -0.208251953125, -0.18731689453125, -0.1663818359375, -0.14544677734375, -0.12451171875, -0.10357666015625, -0.0826416015625, -0.06170654296875, -0.040771484375, -0.01983642578125, 0.0010986328125, 0.02203369140625, 0.04296875, 0.06390380859375, 0.0848388671875, 0.10577392578125, 0.126708984375, 0.14764404296875, 0.1685791015625, 0.18951416015625, 0.21044921875, 0.23138427734375, 0.2523193359375, 0.27325439453125, 0.294189453125, 0.31512451171875, 0.3360595703125, 0.35699462890625, 0.3779296875, 0.39886474609375, 0.4197998046875, 0.44073486328125, 0.461669921875, 0.48260498046875, 0.5035400390625, 0.52447509765625, 0.54541015625, 0.56634521484375, 0.5872802734375, 0.60821533203125, 0.629150390625, 0.65008544921875, 0.6710205078125, 0.69195556640625, 0.712890625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 1.0, 11.0, 16.0, 8.0, 13.0, 22.0, 30.0, 38.0, 49.0, 53.0, 70.0, 61.0, 60.0, 61.0, 79.0, 64.0, 68.0, 52.0, 59.0, 43.0, 34.0, 29.0, 24.0, 13.0, 13.0, 9.0, 5.0, 1.0, 4.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025539398193359375, -0.002471059560775757, -0.002388179302215576, -0.0023052990436553955, -0.002222418785095215, -0.002139538526535034, -0.0020566582679748535, -0.001973778009414673, -0.0018908977508544922, -0.0018080174922943115, -0.0017251372337341309, -0.0016422569751739502, -0.0015593767166137695, -0.0014764964580535889, -0.0013936161994934082, -0.0013107359409332275, -0.0012278556823730469, -0.0011449754238128662, -0.0010620951652526855, -0.0009792149066925049, -0.0008963346481323242, -0.0008134543895721436, -0.0007305741310119629, -0.0006476938724517822, -0.0005648136138916016, -0.0004819333553314209, -0.00039905309677124023, -0.00031617283821105957, -0.0002332925796508789, -0.00015041232109069824, -6.753206253051758e-05, 1.5348196029663086e-05, 9.822845458984375e-05, 0.00018110871315002441, 0.0002639889717102051, 0.00034686923027038574, 0.0004297494888305664, 0.0005126297473907471, 0.0005955100059509277, 0.0006783902645111084, 0.0007612705230712891, 0.0008441507816314697, 0.0009270310401916504, 0.001009911298751831, 0.0010927915573120117, 0.0011756718158721924, 0.001258552074432373, 0.0013414323329925537, 0.0014243125915527344, 0.001507192850112915, 0.0015900731086730957, 0.0016729533672332764, 0.001755833625793457, 0.0018387138843536377, 0.0019215941429138184, 0.002004474401473999, 0.0020873546600341797, 0.0021702349185943604, 0.002253115177154541, 0.0023359954357147217, 0.0024188756942749023, 0.002501755952835083, 0.0025846362113952637, 0.0026675164699554443, 0.002750396728515625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 1.0, 12.0, 11.0, 12.0, 24.0, 31.0, 30.0, 52.0, 81.0, 93.0, 153.0, 299.0, 1391.0, 1033416.0, 11781.0, 535.0, 214.0, 121.0, 70.0, 64.0, 43.0, 30.0, 27.0, 11.0, 9.0, 15.0, 11.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.06536865234375, -0.0634307861328125, -0.061492919921875, -0.0595550537109375, -0.0576171875, -0.0556793212890625, -0.053741455078125, -0.0518035888671875, -0.04986572265625, -0.0479278564453125, -0.045989990234375, -0.0440521240234375, -0.0421142578125, -0.0401763916015625, -0.038238525390625, -0.0363006591796875, -0.03436279296875, -0.0324249267578125, -0.030487060546875, -0.0285491943359375, -0.026611328125, -0.0246734619140625, -0.022735595703125, -0.0207977294921875, -0.01885986328125, -0.0169219970703125, -0.014984130859375, -0.0130462646484375, -0.0111083984375, -0.0091705322265625, -0.007232666015625, -0.0052947998046875, -0.00335693359375, -0.0014190673828125, 0.000518798828125, 0.0024566650390625, 0.00439453125, 0.0063323974609375, 0.008270263671875, 0.0102081298828125, 0.01214599609375, 0.0140838623046875, 0.016021728515625, 0.0179595947265625, 0.0198974609375, 0.0218353271484375, 0.023773193359375, 0.0257110595703125, 0.02764892578125, 0.0295867919921875, 0.031524658203125, 0.0334625244140625, 0.035400390625, 0.0373382568359375, 0.039276123046875, 0.0412139892578125, 0.04315185546875, 0.0450897216796875, 0.047027587890625, 0.0489654541015625, 0.0509033203125, 0.0528411865234375, 0.054779052734375, 0.0567169189453125, 0.05865478515625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 45.0, 944.0, 29.0], "bins": [-0.027769215404987335, -0.027324730530381203, -0.02688024565577507, -0.02643575891852379, -0.025991274043917656, -0.025546789169311523, -0.02510230429470539, -0.02465781942009926, -0.024213332682847977, -0.023768847808241844, -0.02332436293363571, -0.02287987619638443, -0.022435391321778297, -0.021990906447172165, -0.021546421572566032, -0.0211019366979599, -0.020657451823353767, -0.020212966948747635, -0.019768482074141502, -0.01932399533689022, -0.018879510462284088, -0.018435025587677956, -0.017990540713071823, -0.01754605583846569, -0.017101570963859558, -0.016657086089253426, -0.016212601214647293, -0.01576811447739601, -0.015323629602789879, -0.014879144728183746, -0.014434659853577614, -0.013990174978971481, -0.013545687310397625, -0.013101202435791492, -0.012656716629862785, -0.012212231755256653, -0.01176774688065052, -0.011323261074721813, -0.01087877620011568, -0.010434290394186974, -0.009989805519580841, -0.009545320644974709, -0.009100834839046001, -0.008656349964439869, -0.008211864158511162, -0.007767379283905029, -0.007322894409298897, -0.006878409069031477, -0.0064339241944253445, -0.005989438854157925, -0.005544953979551792, -0.005100468639284372, -0.0046559832990169525, -0.004211497958749533, -0.0037670128513127565, -0.0033225277438759804, -0.0028780424036085606, -0.0024335570633411407, -0.0019890719559043646, -0.0015445867320522666, -0.0011001015082001686, -0.0006556161679327488, -0.00021113106049597263, 0.00023335404694080353, 0.0006778395036235452]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 4.0, 4.0, 8.0, 9.0, 7.0, 4.0, 19.0, 20.0, 20.0, 19.0, 25.0, 27.0, 29.0, 34.0, 34.0, 27.0, 28.0, 34.0, 43.0, 31.0, 37.0, 36.0, 46.0, 39.0, 39.0, 46.0, 30.0, 33.0, 33.0, 31.0, 39.0, 36.0, 19.0, 16.0, 21.0, 12.0, 12.0, 11.0, 6.0, 9.0, 8.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009743571281433105, -0.0009409366175532341, -0.0009075161069631577, -0.0008740955963730812, -0.0008406750857830048, -0.0008072545751929283, -0.0007738340646028519, -0.0007404135540127754, -0.000706993043422699, -0.0006735725328326225, -0.0006401520222425461, -0.0006067315116524696, -0.0005733110010623932, -0.0005398904904723167, -0.0005064699798822403, -0.00047304946929216385, -0.0004396289587020874, -0.00040620844811201096, -0.0003727879375219345, -0.00033936742693185806, -0.0003059469163417816, -0.00027252640575170517, -0.00023910589516162872, -0.00020568538457155228, -0.00017226487398147583, -0.00013884436339139938, -0.00010542385280132294, -7.200334221124649e-05, -3.8582831621170044e-05, -5.162321031093597e-06, 2.825818955898285e-05, 6.16787001490593e-05, 9.509921073913574e-05, 0.0001285197213292122, 0.00016194023191928864, 0.00019536074250936508, 0.00022878125309944153, 0.000262201763689518, 0.0002956222742795944, 0.00032904278486967087, 0.0003624632954597473, 0.00039588380604982376, 0.0004293043166399002, 0.00046272482722997665, 0.0004961453378200531, 0.0005295658484101295, 0.000562986359000206, 0.0005964068695902824, 0.0006298273801803589, 0.0006632478907704353, 0.0006966684013605118, 0.0007300889119505882, 0.0007635094225406647, 0.0007969299331307411, 0.0008303504437208176, 0.000863770954310894, 0.0008971914649009705, 0.0009306119754910469, 0.0009640324860811234, 0.0009974529966711998, 0.0010308735072612762, 0.0010642940178513527, 0.0010977145284414291, 0.0011311350390315056, 0.001164555549621582]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 3.0, 6.0, 9.0, 12.0, 10.0, 10.0, 13.0, 10.0, 9.0, 18.0, 23.0, 26.0, 25.0, 20.0, 26.0, 19.0, 32.0, 29.0, 43.0, 45.0, 37.0, 47.0, 40.0, 32.0, 41.0, 34.0, 36.0, 28.0, 31.0, 47.0, 30.0, 24.0, 24.0, 15.0, 22.0, 21.0, 15.0, 13.0, 12.0, 16.0, 13.0, 6.0, 7.0, 8.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.234375, -6.04779052734375, -5.8612060546875, -5.67462158203125, -5.488037109375, -5.30145263671875, -5.1148681640625, -4.92828369140625, -4.74169921875, -4.55511474609375, -4.3685302734375, -4.18194580078125, -3.995361328125, -3.80877685546875, -3.6221923828125, -3.43560791015625, -3.2490234375, -3.06243896484375, -2.8758544921875, -2.68927001953125, -2.502685546875, -2.31610107421875, -2.1295166015625, -1.94293212890625, -1.75634765625, -1.56976318359375, -1.3831787109375, -1.19659423828125, -1.010009765625, -0.82342529296875, -0.6368408203125, -0.45025634765625, -0.263671875, -0.07708740234375, 0.1094970703125, 0.29608154296875, 0.482666015625, 0.66925048828125, 0.8558349609375, 1.04241943359375, 1.22900390625, 1.41558837890625, 1.6021728515625, 1.78875732421875, 1.975341796875, 2.16192626953125, 2.3485107421875, 2.53509521484375, 2.7216796875, 2.90826416015625, 3.0948486328125, 3.28143310546875, 3.468017578125, 3.65460205078125, 3.8411865234375, 4.02777099609375, 4.21435546875, 4.40093994140625, 4.5875244140625, 4.77410888671875, 4.960693359375, 5.14727783203125, 5.3338623046875, 5.52044677734375, 5.70703125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 5.0, 12.0, 10.0, 22.0, 24.0, 33.0, 51.0, 90.0, 123.0, 198.0, 323.0, 498.0, 789.0, 1342.0, 2405.0, 4082.0, 7309.0, 12969.0, 25201.0, 53578.0, 128196.0, 323989.0, 279800.0, 110028.0, 47278.0, 22787.0, 11695.0, 6541.0, 3740.0, 2135.0, 1246.0, 747.0, 470.0, 290.0, 199.0, 112.0, 76.0, 43.0, 41.0, 13.0, 13.0, 16.0, 8.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.234375, -4.105743408203125, -3.97711181640625, -3.848480224609375, -3.7198486328125, -3.591217041015625, -3.46258544921875, -3.333953857421875, -3.205322265625, -3.076690673828125, -2.94805908203125, -2.819427490234375, -2.6907958984375, -2.562164306640625, -2.43353271484375, -2.304901123046875, -2.17626953125, -2.047637939453125, -1.91900634765625, -1.790374755859375, -1.6617431640625, -1.533111572265625, -1.40447998046875, -1.275848388671875, -1.147216796875, -1.018585205078125, -0.88995361328125, -0.761322021484375, -0.6326904296875, -0.504058837890625, -0.37542724609375, -0.246795654296875, -0.1181640625, 0.010467529296875, 0.13909912109375, 0.267730712890625, 0.3963623046875, 0.524993896484375, 0.65362548828125, 0.782257080078125, 0.910888671875, 1.039520263671875, 1.16815185546875, 1.296783447265625, 1.4254150390625, 1.554046630859375, 1.68267822265625, 1.811309814453125, 1.93994140625, 2.068572998046875, 2.19720458984375, 2.325836181640625, 2.4544677734375, 2.583099365234375, 2.71173095703125, 2.840362548828125, 2.968994140625, 3.097625732421875, 3.22625732421875, 3.354888916015625, 3.4835205078125, 3.612152099609375, 3.74078369140625, 3.869415283203125, 3.998046875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 2.0, 7.0, 2.0, 11.0, 10.0, 13.0, 21.0, 16.0, 18.0, 28.0, 26.0, 21.0, 36.0, 33.0, 40.0, 37.0, 52.0, 57.0, 75.0, 320.0, 1606.0, 145.0, 53.0, 49.0, 50.0, 54.0, 28.0, 31.0, 26.0, 35.0, 27.0, 22.0, 18.0, 13.0, 15.0, 7.0, 6.0, 8.0, 5.0, 8.0, 3.0, 5.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-22.75, -22.0439453125, -21.337890625, -20.6318359375, -19.92578125, -19.2197265625, -18.513671875, -17.8076171875, -17.1015625, -16.3955078125, -15.689453125, -14.9833984375, -14.27734375, -13.5712890625, -12.865234375, -12.1591796875, -11.453125, -10.7470703125, -10.041015625, -9.3349609375, -8.62890625, -7.9228515625, -7.216796875, -6.5107421875, -5.8046875, -5.0986328125, -4.392578125, -3.6865234375, -2.98046875, -2.2744140625, -1.568359375, -0.8623046875, -0.15625, 0.5498046875, 1.255859375, 1.9619140625, 2.66796875, 3.3740234375, 4.080078125, 4.7861328125, 5.4921875, 6.1982421875, 6.904296875, 7.6103515625, 8.31640625, 9.0224609375, 9.728515625, 10.4345703125, 11.140625, 11.8466796875, 12.552734375, 13.2587890625, 13.96484375, 14.6708984375, 15.376953125, 16.0830078125, 16.7890625, 17.4951171875, 18.201171875, 18.9072265625, 19.61328125, 20.3193359375, 21.025390625, 21.7314453125, 22.4375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 6.0, 7.0, 0.0, 4.0, 10.0, 7.0, 5.0, 14.0, 15.0, 15.0, 45.0, 37.0, 45.0, 69.0, 64.0, 118.0, 156.0, 223.0, 331.0, 791.0, 6489.0, 3104170.0, 30736.0, 1041.0, 395.0, 230.0, 192.0, 135.0, 84.0, 74.0, 50.0, 34.0, 29.0, 29.0, 18.0, 14.0, 8.0, 5.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.09375, -49.10107421875, -47.1083984375, -45.11572265625, -43.123046875, -41.13037109375, -39.1376953125, -37.14501953125, -35.15234375, -33.15966796875, -31.1669921875, -29.17431640625, -27.181640625, -25.18896484375, -23.1962890625, -21.20361328125, -19.2109375, -17.21826171875, -15.2255859375, -13.23291015625, -11.240234375, -9.24755859375, -7.2548828125, -5.26220703125, -3.26953125, -1.27685546875, 0.7158203125, 2.70849609375, 4.701171875, 6.69384765625, 8.6865234375, 10.67919921875, 12.671875, 14.66455078125, 16.6572265625, 18.64990234375, 20.642578125, 22.63525390625, 24.6279296875, 26.62060546875, 28.61328125, 30.60595703125, 32.5986328125, 34.59130859375, 36.583984375, 38.57666015625, 40.5693359375, 42.56201171875, 44.5546875, 46.54736328125, 48.5400390625, 50.53271484375, 52.525390625, 54.51806640625, 56.5107421875, 58.50341796875, 60.49609375, 62.48876953125, 64.4814453125, 66.47412109375, 68.466796875, 70.45947265625, 72.4521484375, 74.44482421875, 76.4375]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 109.0, 880.0, 26.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.989105224609375, -14.817363739013672, -8.645621299743652, -2.473878860473633, 3.6978626251220703, 9.869604110717773, 16.04134750366211, 22.213088989257812, 28.384830474853516, 34.55657196044922, 40.72831344604492, 46.900054931640625, 53.071800231933594, 59.24353790283203, 65.415283203125, 71.58702087402344, 77.7587661743164, 83.93051147460938, 90.10224914550781, 96.27399444580078, 102.44573211669922, 108.61747741699219, 114.78921508789062, 120.9609603881836, 127.13270568847656, 133.304443359375, 139.4761962890625, 145.64793395996094, 151.81967163085938, 157.9914093017578, 164.1631622314453, 170.33489990234375, 176.5066375732422, 182.67837524414062, 188.85012817382812, 195.02186584472656, 201.193603515625, 207.36534118652344, 213.53709411621094, 219.70883178710938, 225.8805694580078, 232.05230712890625, 238.22406005859375, 244.3957977294922, 250.56753540039062, 256.7392883300781, 262.9110107421875, 269.082763671875, 275.2545166015625, 281.42626953125, 287.5979919433594, 293.7697448730469, 299.9414978027344, 306.11322021484375, 312.28497314453125, 318.45672607421875, 324.6284484863281, 330.8002014160156, 336.971923828125, 343.1436767578125, 349.3154296875, 355.4871520996094, 361.6589050292969, 367.83062744140625, 374.00238037109375]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 9.0, 6.0, 12.0, 8.0, 14.0, 13.0, 31.0, 22.0, 30.0, 25.0, 27.0, 34.0, 30.0, 34.0, 42.0, 31.0, 40.0, 44.0, 41.0, 43.0, 29.0, 47.0, 36.0, 34.0, 40.0, 46.0, 30.0, 30.0, 31.0, 21.0, 25.0, 15.0, 13.0, 17.0, 6.0, 7.0, 7.0, 7.0, 2.0, 1.0, 0.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-53.56270217895508, -51.846717834472656, -50.130733489990234, -48.41474914550781, -46.69876480102539, -44.98278045654297, -43.26679992675781, -41.550811767578125, -39.83483123779297, -38.11884689331055, -36.402862548828125, -34.6868782043457, -32.97089385986328, -31.25490951538086, -29.53892707824707, -27.82294273376465, -26.106956481933594, -24.390972137451172, -22.67498779296875, -20.959003448486328, -19.243019104003906, -17.527034759521484, -15.811052322387695, -14.095067977905273, -12.379083633422852, -10.66309928894043, -8.947114944458008, -7.231131553649902, -5.5151472091674805, -3.7991628646850586, -2.083179473876953, -0.36719512939453125, 1.3487892150878906, 3.0647733211517334, 4.780757427215576, 6.49674129486084, 8.212725639343262, 9.928709983825684, 11.644693374633789, 13.360677719116211, 15.076662063598633, 16.792646408081055, 18.508630752563477, 20.224613189697266, 21.940597534179688, 23.65658187866211, 25.37256622314453, 27.088550567626953, 28.804534912109375, 30.520519256591797, 32.23650360107422, 33.95248794555664, 35.66847229003906, 37.384456634521484, 39.100440979003906, 40.81642150878906, 42.53240966796875, 44.24839401245117, 45.964378356933594, 47.680362701416016, 49.39634704589844, 51.11233139038086, 52.82831573486328, 54.54429626464844, 56.26028060913086]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 5.0, 3.0, 7.0, 7.0, 5.0, 5.0, 14.0, 15.0, 10.0, 10.0, 13.0, 16.0, 20.0, 22.0, 20.0, 17.0, 26.0, 30.0, 25.0, 31.0, 39.0, 45.0, 40.0, 35.0, 41.0, 40.0, 44.0, 29.0, 42.0, 32.0, 28.0, 37.0, 30.0, 33.0, 19.0, 26.0, 23.0, 18.0, 13.0, 19.0, 11.0, 8.0, 14.0, 11.0, 9.0, 6.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-6.7421875, -6.54766845703125, -6.3531494140625, -6.15863037109375, -5.964111328125, -5.76959228515625, -5.5750732421875, -5.38055419921875, -5.18603515625, -4.99151611328125, -4.7969970703125, -4.60247802734375, -4.407958984375, -4.21343994140625, -4.0189208984375, -3.82440185546875, -3.6298828125, -3.43536376953125, -3.2408447265625, -3.04632568359375, -2.851806640625, -2.65728759765625, -2.4627685546875, -2.26824951171875, -2.07373046875, -1.87921142578125, -1.6846923828125, -1.49017333984375, -1.295654296875, -1.10113525390625, -0.9066162109375, -0.71209716796875, -0.517578125, -0.32305908203125, -0.1285400390625, 0.06597900390625, 0.260498046875, 0.45501708984375, 0.6495361328125, 0.84405517578125, 1.03857421875, 1.23309326171875, 1.4276123046875, 1.62213134765625, 1.816650390625, 2.01116943359375, 2.2056884765625, 2.40020751953125, 2.5947265625, 2.78924560546875, 2.9837646484375, 3.17828369140625, 3.372802734375, 3.56732177734375, 3.7618408203125, 3.95635986328125, 4.15087890625, 4.34539794921875, 4.5399169921875, 4.73443603515625, 4.928955078125, 5.12347412109375, 5.3179931640625, 5.51251220703125, 5.70703125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 1.0, 6.0, 13.0, 8.0, 7.0, 10.0, 11.0, 11.0, 13.0, 19.0, 27.0, 27.0, 25.0, 55.0, 58.0, 84.0, 126.0, 246.0, 675.0, 2192.0, 12812.0, 372773.0, 3340456.0, 447050.0, 13743.0, 2305.0, 705.0, 300.0, 139.0, 86.0, 48.0, 45.0, 35.0, 19.0, 15.0, 25.0, 15.0, 18.0, 9.0, 10.0, 11.0, 8.0, 9.0, 7.0, 6.0, 5.0, 2.0, 2.0, 0.0, 3.0, 3.0], "bins": [-23.40625, -22.747314453125, -22.08837890625, -21.429443359375, -20.7705078125, -20.111572265625, -19.45263671875, -18.793701171875, -18.134765625, -17.475830078125, -16.81689453125, -16.157958984375, -15.4990234375, -14.840087890625, -14.18115234375, -13.522216796875, -12.86328125, -12.204345703125, -11.54541015625, -10.886474609375, -10.2275390625, -9.568603515625, -8.90966796875, -8.250732421875, -7.591796875, -6.932861328125, -6.27392578125, -5.614990234375, -4.9560546875, -4.297119140625, -3.63818359375, -2.979248046875, -2.3203125, -1.661376953125, -1.00244140625, -0.343505859375, 0.3154296875, 0.974365234375, 1.63330078125, 2.292236328125, 2.951171875, 3.610107421875, 4.26904296875, 4.927978515625, 5.5869140625, 6.245849609375, 6.90478515625, 7.563720703125, 8.22265625, 8.881591796875, 9.54052734375, 10.199462890625, 10.8583984375, 11.517333984375, 12.17626953125, 12.835205078125, 13.494140625, 14.153076171875, 14.81201171875, 15.470947265625, 16.1298828125, 16.788818359375, 17.44775390625, 18.106689453125, 18.765625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 8.0, 12.0, 21.0, 13.0, 42.0, 65.0, 89.0, 126.0, 230.0, 319.0, 416.0, 588.0, 620.0, 459.0, 334.0, 222.0, 160.0, 109.0, 91.0, 52.0, 28.0, 19.0, 19.0, 8.0, 7.0, 4.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.078125, -16.591796875, -16.10546875, -15.619140625, -15.1328125, -14.646484375, -14.16015625, -13.673828125, -13.1875, -12.701171875, -12.21484375, -11.728515625, -11.2421875, -10.755859375, -10.26953125, -9.783203125, -9.296875, -8.810546875, -8.32421875, -7.837890625, -7.3515625, -6.865234375, -6.37890625, -5.892578125, -5.40625, -4.919921875, -4.43359375, -3.947265625, -3.4609375, -2.974609375, -2.48828125, -2.001953125, -1.515625, -1.029296875, -0.54296875, -0.056640625, 0.4296875, 0.916015625, 1.40234375, 1.888671875, 2.375, 2.861328125, 3.34765625, 3.833984375, 4.3203125, 4.806640625, 5.29296875, 5.779296875, 6.265625, 6.751953125, 7.23828125, 7.724609375, 8.2109375, 8.697265625, 9.18359375, 9.669921875, 10.15625, 10.642578125, 11.12890625, 11.615234375, 12.1015625, 12.587890625, 13.07421875, 13.560546875, 14.046875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 5.0, 7.0, 7.0, 15.0, 27.0, 33.0, 45.0, 49.0, 74.0, 98.0, 145.0, 169.0, 291.0, 344.0, 809.0, 3667.0, 1216392.0, 2964322.0, 5538.0, 849.0, 415.0, 315.0, 183.0, 121.0, 112.0, 77.0, 47.0, 36.0, 27.0, 18.0, 13.0, 13.0, 10.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.53125, -58.58251953125, -56.6337890625, -54.68505859375, -52.736328125, -50.78759765625, -48.8388671875, -46.89013671875, -44.94140625, -42.99267578125, -41.0439453125, -39.09521484375, -37.146484375, -35.19775390625, -33.2490234375, -31.30029296875, -29.3515625, -27.40283203125, -25.4541015625, -23.50537109375, -21.556640625, -19.60791015625, -17.6591796875, -15.71044921875, -13.76171875, -11.81298828125, -9.8642578125, -7.91552734375, -5.966796875, -4.01806640625, -2.0693359375, -0.12060546875, 1.828125, 3.77685546875, 5.7255859375, 7.67431640625, 9.623046875, 11.57177734375, 13.5205078125, 15.46923828125, 17.41796875, 19.36669921875, 21.3154296875, 23.26416015625, 25.212890625, 27.16162109375, 29.1103515625, 31.05908203125, 33.0078125, 34.95654296875, 36.9052734375, 38.85400390625, 40.802734375, 42.75146484375, 44.7001953125, 46.64892578125, 48.59765625, 50.54638671875, 52.4951171875, 54.44384765625, 56.392578125, 58.34130859375, 60.2900390625, 62.23876953125, 64.1875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 9.0, 21.0, 68.0, 131.0, 207.0, 221.0, 163.0, 111.0, 57.0, 13.0, 9.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.02861404418945, -45.37352752685547, -42.71844482421875, -40.063358306884766, -37.40827560424805, -34.75318908691406, -32.098106384277344, -29.44301986694336, -26.787935256958008, -24.132850646972656, -21.477766036987305, -18.822681427001953, -16.16759490966797, -13.512511253356934, -10.857425689697266, -8.202341079711914, -5.5472564697265625, -2.892171621322632, -0.23708677291870117, 2.4179983139038086, 5.07308292388916, 7.728167533874512, 10.38325309753418, 13.038337707519531, 15.693422317504883, 18.348506927490234, 21.003591537475586, 23.658676147460938, 26.313762664794922, 28.96884536743164, 31.623931884765625, 34.279014587402344, 36.934104919433594, 39.58919143676758, 42.2442741394043, 44.89936065673828, 47.554443359375, 50.209529876708984, 52.86461639404297, 55.51969909667969, 58.174781799316406, 60.82986831665039, 63.48495101928711, 66.1400375366211, 68.79512023925781, 71.45020294189453, 74.10529327392578, 76.7603759765625, 79.41546630859375, 82.07054901123047, 84.72563934326172, 87.38072204589844, 90.03580474853516, 92.69088745117188, 95.34597778320312, 98.00106048583984, 100.65614318847656, 103.31122589111328, 105.96631622314453, 108.62139892578125, 111.27648162841797, 113.93156433105469, 116.58665466308594, 119.24173736572266, 121.89682006835938]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 3.0, 8.0, 9.0, 8.0, 7.0, 15.0, 7.0, 21.0, 15.0, 25.0, 24.0, 27.0, 33.0, 39.0, 36.0, 46.0, 53.0, 42.0, 36.0, 48.0, 41.0, 47.0, 41.0, 44.0, 37.0, 35.0, 31.0, 32.0, 26.0, 33.0, 18.0, 15.0, 23.0, 8.0, 9.0, 12.0, 8.0, 11.0, 8.0, 4.0, 1.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-42.177490234375, -40.9301872253418, -39.682884216308594, -38.43558120727539, -37.18827819824219, -35.94097137451172, -34.693668365478516, -33.44636535644531, -32.19906234741211, -30.951759338378906, -29.704456329345703, -28.457151412963867, -27.209848403930664, -25.96254539489746, -24.715240478515625, -23.467937469482422, -22.22063446044922, -20.973331451416016, -19.726028442382812, -18.478723526000977, -17.231420516967773, -15.98411750793457, -14.73681354522705, -13.489509582519531, -12.242206573486328, -10.994903564453125, -9.747599601745605, -8.500295639038086, -7.252992630004883, -6.0056891441345215, -4.75838565826416, -3.5110816955566406, -2.2637786865234375, -1.0164752006530762, 0.23082828521728516, 1.4781317710876465, 2.725435256958008, 3.972738742828369, 5.2200422286987305, 6.46734619140625, 7.714649200439453, 8.961952209472656, 10.209256172180176, 11.456560134887695, 12.703863143920898, 13.951166152954102, 15.198470115661621, 16.44577407836914, 17.693077087402344, 18.940380096435547, 20.18768310546875, 21.434988021850586, 22.68229103088379, 23.929594039916992, 25.176898956298828, 26.42420196533203, 27.671504974365234, 28.918807983398438, 30.16611099243164, 31.413415908813477, 32.66072082519531, 33.908023834228516, 35.15532684326172, 36.40262985229492, 37.649932861328125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 8.0, 5.0, 10.0, 9.0, 9.0, 16.0, 21.0, 12.0, 15.0, 12.0, 17.0, 28.0, 27.0, 22.0, 31.0, 29.0, 35.0, 38.0, 37.0, 39.0, 43.0, 46.0, 56.0, 42.0, 35.0, 44.0, 37.0, 32.0, 34.0, 27.0, 15.0, 22.0, 30.0, 18.0, 17.0, 7.0, 13.0, 11.0, 6.0, 10.0, 6.0, 4.0, 4.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.859375, -6.66290283203125, -6.4664306640625, -6.26995849609375, -6.073486328125, -5.87701416015625, -5.6805419921875, -5.48406982421875, -5.28759765625, -5.09112548828125, -4.8946533203125, -4.69818115234375, -4.501708984375, -4.30523681640625, -4.1087646484375, -3.91229248046875, -3.7158203125, -3.51934814453125, -3.3228759765625, -3.12640380859375, -2.929931640625, -2.73345947265625, -2.5369873046875, -2.34051513671875, -2.14404296875, -1.94757080078125, -1.7510986328125, -1.55462646484375, -1.358154296875, -1.16168212890625, -0.9652099609375, -0.76873779296875, -0.572265625, -0.37579345703125, -0.1793212890625, 0.01715087890625, 0.213623046875, 0.41009521484375, 0.6065673828125, 0.80303955078125, 0.99951171875, 1.19598388671875, 1.3924560546875, 1.58892822265625, 1.785400390625, 1.98187255859375, 2.1783447265625, 2.37481689453125, 2.5712890625, 2.76776123046875, 2.9642333984375, 3.16070556640625, 3.357177734375, 3.55364990234375, 3.7501220703125, 3.94659423828125, 4.14306640625, 4.33953857421875, 4.5360107421875, 4.73248291015625, 4.928955078125, 5.12542724609375, 5.3218994140625, 5.51837158203125, 5.71484375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 7.0, 6.0, 8.0, 15.0, 10.0, 25.0, 50.0, 62.0, 85.0, 174.0, 234.0, 294.0, 428.0, 686.0, 997.0, 1451.0, 2104.0, 3151.0, 4660.0, 7099.0, 10690.0, 16302.0, 24752.0, 38790.0, 61036.0, 98518.0, 151838.0, 188644.0, 156720.0, 101602.0, 62894.0, 40007.0, 25575.0, 16716.0, 10826.0, 7302.0, 4855.0, 3314.0, 2170.0, 1353.0, 1012.0, 634.0, 458.0, 308.0, 236.0, 146.0, 94.0, 81.0, 50.0, 30.0, 19.0, 15.0, 15.0, 4.0, 4.0, 6.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.59326171875, -0.5731735229492188, -0.5530853271484375, -0.5329971313476562, -0.512908935546875, -0.49282073974609375, -0.4727325439453125, -0.45264434814453125, -0.43255615234375, -0.41246795654296875, -0.3923797607421875, -0.37229156494140625, -0.352203369140625, -0.33211517333984375, -0.3120269775390625, -0.29193878173828125, -0.2718505859375, -0.25176239013671875, -0.2316741943359375, -0.21158599853515625, -0.191497802734375, -0.17140960693359375, -0.1513214111328125, -0.13123321533203125, -0.11114501953125, -0.09105682373046875, -0.0709686279296875, -0.05088043212890625, -0.030792236328125, -0.01070404052734375, 0.0093841552734375, 0.02947235107421875, 0.049560546875, 0.06964874267578125, 0.0897369384765625, 0.10982513427734375, 0.129913330078125, 0.15000152587890625, 0.1700897216796875, 0.19017791748046875, 0.21026611328125, 0.23035430908203125, 0.2504425048828125, 0.27053070068359375, 0.290618896484375, 0.31070709228515625, 0.3307952880859375, 0.35088348388671875, 0.3709716796875, 0.39105987548828125, 0.4111480712890625, 0.43123626708984375, 0.451324462890625, 0.47141265869140625, 0.4915008544921875, 0.5115890502929688, 0.53167724609375, 0.5517654418945312, 0.5718536376953125, 0.5919418334960938, 0.612030029296875, 0.6321182250976562, 0.6522064208984375, 0.6722946166992188, 0.6923828125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 5.0, 2.0, 8.0, 13.0, 9.0, 7.0, 15.0, 15.0, 20.0, 15.0, 23.0, 31.0, 31.0, 30.0, 36.0, 37.0, 32.0, 35.0, 48.0, 39.0, 42.0, 1069.0, 32.0, 41.0, 41.0, 39.0, 37.0, 26.0, 25.0, 34.0, 28.0, 28.0, 26.0, 21.0, 14.0, 7.0, 8.0, 5.0, 11.0, 9.0, 7.0, 4.0, 5.0, 8.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.00390625, -3.875244140625, -3.74658203125, -3.617919921875, -3.4892578125, -3.360595703125, -3.23193359375, -3.103271484375, -2.974609375, -2.845947265625, -2.71728515625, -2.588623046875, -2.4599609375, -2.331298828125, -2.20263671875, -2.073974609375, -1.9453125, -1.816650390625, -1.68798828125, -1.559326171875, -1.4306640625, -1.302001953125, -1.17333984375, -1.044677734375, -0.916015625, -0.787353515625, -0.65869140625, -0.530029296875, -0.4013671875, -0.272705078125, -0.14404296875, -0.015380859375, 0.11328125, 0.241943359375, 0.37060546875, 0.499267578125, 0.6279296875, 0.756591796875, 0.88525390625, 1.013916015625, 1.142578125, 1.271240234375, 1.39990234375, 1.528564453125, 1.6572265625, 1.785888671875, 1.91455078125, 2.043212890625, 2.171875, 2.300537109375, 2.42919921875, 2.557861328125, 2.6865234375, 2.815185546875, 2.94384765625, 3.072509765625, 3.201171875, 3.329833984375, 3.45849609375, 3.587158203125, 3.7158203125, 3.844482421875, 3.97314453125, 4.101806640625, 4.23046875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [5.0, 2.0, 0.0, 3.0, 1.0, 2.0, 8.0, 9.0, 18.0, 21.0, 36.0, 44.0, 74.0, 98.0, 169.0, 266.0, 373.0, 656.0, 959.0, 1713.0, 2589.0, 4182.0, 6810.0, 11140.0, 18540.0, 31202.0, 53429.0, 94529.0, 161808.0, 1267066.0, 180257.0, 109545.0, 62044.0, 35254.0, 21169.0, 12714.0, 7774.0, 4847.0, 2944.0, 1739.0, 1084.0, 643.0, 484.0, 314.0, 201.0, 141.0, 78.0, 57.0, 33.0, 29.0, 14.0, 12.0, 7.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6552734375, -0.6331558227539062, -0.6110382080078125, -0.5889205932617188, -0.566802978515625, -0.5446853637695312, -0.5225677490234375, -0.5004501342773438, -0.47833251953125, -0.45621490478515625, -0.4340972900390625, -0.41197967529296875, -0.389862060546875, -0.36774444580078125, -0.3456268310546875, -0.32350921630859375, -0.3013916015625, -0.27927398681640625, -0.2571563720703125, -0.23503875732421875, -0.212921142578125, -0.19080352783203125, -0.1686859130859375, -0.14656829833984375, -0.12445068359375, -0.10233306884765625, -0.0802154541015625, -0.05809783935546875, -0.035980224609375, -0.01386260986328125, 0.0082550048828125, 0.03037261962890625, 0.052490234375, 0.07460784912109375, 0.0967254638671875, 0.11884307861328125, 0.140960693359375, 0.16307830810546875, 0.1851959228515625, 0.20731353759765625, 0.22943115234375, 0.25154876708984375, 0.2736663818359375, 0.29578399658203125, 0.317901611328125, 0.34001922607421875, 0.3621368408203125, 0.38425445556640625, 0.4063720703125, 0.42848968505859375, 0.4506072998046875, 0.47272491455078125, 0.494842529296875, 0.5169601440429688, 0.5390777587890625, 0.5611953735351562, 0.58331298828125, 0.6054306030273438, 0.6275482177734375, 0.6496658325195312, 0.671783447265625, 0.6939010620117188, 0.7160186767578125, 0.7381362915039062, 0.76025390625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 4.0, 1.0, 4.0, 5.0, 7.0, 8.0, 9.0, 13.0, 12.0, 12.0, 20.0, 17.0, 20.0, 35.0, 35.0, 35.0, 60.0, 48.0, 62.0, 42.0, 50.0, 59.0, 53.0, 52.0, 50.0, 36.0, 46.0, 27.0, 27.0, 29.0, 20.0, 24.0, 13.0, 14.0, 11.0, 5.0, 7.0, 4.0, 3.0, 5.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0], "bins": [-0.0019083023071289062, -0.001855015754699707, -0.0018017292022705078, -0.0017484426498413086, -0.0016951560974121094, -0.0016418695449829102, -0.001588582992553711, -0.0015352964401245117, -0.0014820098876953125, -0.0014287233352661133, -0.001375436782836914, -0.0013221502304077148, -0.0012688636779785156, -0.0012155771255493164, -0.0011622905731201172, -0.001109004020690918, -0.0010557174682617188, -0.0010024309158325195, -0.0009491443634033203, -0.0008958578109741211, -0.0008425712585449219, -0.0007892847061157227, -0.0007359981536865234, -0.0006827116012573242, -0.000629425048828125, -0.0005761384963989258, -0.0005228519439697266, -0.00046956539154052734, -0.0004162788391113281, -0.0003629922866821289, -0.0003097057342529297, -0.00025641918182373047, -0.00020313262939453125, -0.00014984607696533203, -9.655952453613281e-05, -4.3272972106933594e-05, 1.0013580322265625e-05, 6.330013275146484e-05, 0.00011658668518066406, 0.00016987323760986328, 0.0002231597900390625, 0.0002764463424682617, 0.00032973289489746094, 0.00038301944732666016, 0.0004363059997558594, 0.0004895925521850586, 0.0005428791046142578, 0.000596165657043457, 0.0006494522094726562, 0.0007027387619018555, 0.0007560253143310547, 0.0008093118667602539, 0.0008625984191894531, 0.0009158849716186523, 0.0009691715240478516, 0.0010224580764770508, 0.00107574462890625, 0.0011290311813354492, 0.0011823177337646484, 0.0012356042861938477, 0.0012888908386230469, 0.001342177391052246, 0.0013954639434814453, 0.0014487504959106445, 0.0015020370483398438]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 6.0, 4.0, 5.0, 5.0, 7.0, 12.0, 17.0, 14.0, 16.0, 42.0, 43.0, 50.0, 63.0, 91.0, 158.0, 262.0, 794.0, 21558.0, 1022278.0, 1963.0, 490.0, 194.0, 111.0, 96.0, 61.0, 59.0, 34.0, 29.0, 18.0, 13.0, 14.0, 11.0, 6.0, 4.0, 6.0, 4.0, 2.0, 5.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03631591796875, -0.03493499755859375, -0.0335540771484375, -0.03217315673828125, -0.030792236328125, -0.02941131591796875, -0.0280303955078125, -0.02664947509765625, -0.0252685546875, -0.02388763427734375, -0.0225067138671875, -0.02112579345703125, -0.019744873046875, -0.01836395263671875, -0.0169830322265625, -0.01560211181640625, -0.01422119140625, -0.01284027099609375, -0.0114593505859375, -0.01007843017578125, -0.008697509765625, -0.00731658935546875, -0.0059356689453125, -0.00455474853515625, -0.003173828125, -0.00179290771484375, -0.0004119873046875, 0.00096893310546875, 0.002349853515625, 0.00373077392578125, 0.0051116943359375, 0.00649261474609375, 0.00787353515625, 0.00925445556640625, 0.0106353759765625, 0.01201629638671875, 0.013397216796875, 0.01477813720703125, 0.0161590576171875, 0.01753997802734375, 0.0189208984375, 0.02030181884765625, 0.0216827392578125, 0.02306365966796875, 0.024444580078125, 0.02582550048828125, 0.0272064208984375, 0.02858734130859375, 0.02996826171875, 0.03134918212890625, 0.0327301025390625, 0.03411102294921875, 0.035491943359375, 0.03687286376953125, 0.0382537841796875, 0.03963470458984375, 0.041015625, 0.04239654541015625, 0.0437774658203125, 0.04515838623046875, 0.046539306640625, 0.04792022705078125, 0.0493011474609375, 0.05068206787109375, 0.05206298828125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 20.0, 356.0, 583.0, 57.0, 2.0, 1.0], "bins": [-0.013125949539244175, -0.012907786294817924, -0.012689623050391674, -0.012471459805965424, -0.012253296561539173, -0.012035133317112923, -0.011816970072686672, -0.011598806828260422, -0.011380643583834171, -0.01116248033940792, -0.01094431709498167, -0.01072615385055542, -0.01050799060612917, -0.010289827361702919, -0.010071664117276669, -0.009853500872850418, -0.009635338559746742, -0.009417175315320492, -0.009199012070894241, -0.008980848826467991, -0.00876268558204174, -0.00854452233761549, -0.00832635909318924, -0.008108195848762989, -0.007890032604336739, -0.007671869359910488, -0.007453706115484238, -0.007235542871057987, -0.007017379626631737, -0.006799216382205486, -0.006581053137779236, -0.006362890359014273, -0.006144726648926735, -0.0059265634045004845, -0.005708400160074234, -0.0054902369156479836, -0.005272073671221733, -0.005053910426795483, -0.004835747182369232, -0.004617584403604269, -0.004399421159178019, -0.004181257914751768, -0.003963094670325518, -0.003744931425899267, -0.0035267684143036604, -0.00330860516987741, -0.0030904419254511595, -0.0028722789138555527, -0.002654115669429302, -0.0024359524250030518, -0.0022177891805768013, -0.001999625936150551, -0.001781462924554944, -0.0015632996801286936, -0.0013451364357024431, -0.0011269733076915145, -0.0009088100050576031, -0.0006906468188390136, -0.0004724836035165936, -0.0002543203881941736, -3.615720197558403e-05, 0.00018200598424300551, 0.00040016922866925597, 0.0006183323566801846, 0.0008364956011064351]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 4.0, 5.0, 2.0, 8.0, 4.0, 11.0, 6.0, 9.0, 9.0, 12.0, 20.0, 18.0, 23.0, 22.0, 32.0, 25.0, 31.0, 25.0, 27.0, 41.0, 40.0, 47.0, 43.0, 39.0, 39.0, 37.0, 32.0, 31.0, 34.0, 25.0, 37.0, 28.0, 29.0, 31.0, 25.0, 29.0, 25.0, 10.0, 20.0, 7.0, 15.0, 11.0, 4.0, 14.0, 6.0, 5.0, 2.0, 6.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0009667873382568359, -0.0009379889816045761, -0.0009091906249523163, -0.0008803922683000565, -0.0008515939116477966, -0.0008227955549955368, -0.000793997198343277, -0.0007651988416910172, -0.0007364004850387573, -0.0007076021283864975, -0.0006788037717342377, -0.0006500054150819778, -0.000621207058429718, -0.0005924087017774582, -0.0005636103451251984, -0.0005348119884729385, -0.0005060136318206787, -0.0004772152751684189, -0.00044841691851615906, -0.00041961856186389923, -0.0003908202052116394, -0.0003620218485593796, -0.00033322349190711975, -0.0003044251352548599, -0.0002756267786026001, -0.00024682842195034027, -0.00021803006529808044, -0.00018923170864582062, -0.0001604333519935608, -0.00013163499534130096, -0.00010283663868904114, -7.403828203678131e-05, -4.5239925384521484e-05, -1.6441568732261658e-05, 1.2356787919998169e-05, 4.1155144572257996e-05, 6.995350122451782e-05, 9.875185787677765e-05, 0.00012755021452903748, 0.0001563485711812973, 0.00018514692783355713, 0.00021394528448581696, 0.00024274364113807678, 0.0002715419977903366, 0.00030034035444259644, 0.00032913871109485626, 0.0003579370677471161, 0.0003867354243993759, 0.00041553378105163574, 0.00044433213770389557, 0.0004731304943561554, 0.0005019288510084152, 0.000530727207660675, 0.0005595255643129349, 0.0005883239209651947, 0.0006171222776174545, 0.0006459206342697144, 0.0006747189909219742, 0.000703517347574234, 0.0007323157042264938, 0.0007611140608787537, 0.0007899124175310135, 0.0008187107741832733, 0.0008475091308355331, 0.000876307487487793]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 4.0, 8.0, 5.0, 10.0, 9.0, 9.0, 16.0, 21.0, 12.0, 15.0, 12.0, 17.0, 28.0, 27.0, 22.0, 31.0, 29.0, 35.0, 38.0, 37.0, 39.0, 43.0, 46.0, 56.0, 42.0, 35.0, 44.0, 37.0, 32.0, 34.0, 27.0, 15.0, 22.0, 30.0, 18.0, 17.0, 7.0, 13.0, 11.0, 6.0, 10.0, 6.0, 4.0, 4.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.859375, -6.66290283203125, -6.4664306640625, -6.26995849609375, -6.073486328125, -5.87701416015625, -5.6805419921875, -5.48406982421875, -5.28759765625, -5.09112548828125, -4.8946533203125, -4.69818115234375, -4.501708984375, -4.30523681640625, -4.1087646484375, -3.91229248046875, -3.7158203125, -3.51934814453125, -3.3228759765625, -3.12640380859375, -2.929931640625, -2.73345947265625, -2.5369873046875, -2.34051513671875, -2.14404296875, -1.94757080078125, -1.7510986328125, -1.55462646484375, -1.358154296875, -1.16168212890625, -0.9652099609375, -0.76873779296875, -0.572265625, -0.37579345703125, -0.1793212890625, 0.01715087890625, 0.213623046875, 0.41009521484375, 0.6065673828125, 0.80303955078125, 0.99951171875, 1.19598388671875, 1.3924560546875, 1.58892822265625, 1.785400390625, 1.98187255859375, 2.1783447265625, 2.37481689453125, 2.5712890625, 2.76776123046875, 2.9642333984375, 3.16070556640625, 3.357177734375, 3.55364990234375, 3.7501220703125, 3.94659423828125, 4.14306640625, 4.33953857421875, 4.5360107421875, 4.73248291015625, 4.928955078125, 5.12542724609375, 5.3218994140625, 5.51837158203125, 5.71484375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 5.0, 1.0, 9.0, 13.0, 7.0, 18.0, 15.0, 26.0, 25.0, 47.0, 55.0, 58.0, 88.0, 126.0, 142.0, 225.0, 360.0, 641.0, 1296.0, 2819.0, 6933.0, 18537.0, 50616.0, 150368.0, 471330.0, 229609.0, 72152.0, 25767.0, 9636.0, 3723.0, 1652.0, 771.0, 443.0, 316.0, 210.0, 122.0, 94.0, 73.0, 60.0, 47.0, 30.0, 21.0, 16.0, 18.0, 10.0, 8.0, 5.0, 7.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-6.92578125, -6.72601318359375, -6.5262451171875, -6.32647705078125, -6.126708984375, -5.92694091796875, -5.7271728515625, -5.52740478515625, -5.32763671875, -5.12786865234375, -4.9281005859375, -4.72833251953125, -4.528564453125, -4.32879638671875, -4.1290283203125, -3.92926025390625, -3.7294921875, -3.52972412109375, -3.3299560546875, -3.13018798828125, -2.930419921875, -2.73065185546875, -2.5308837890625, -2.33111572265625, -2.13134765625, -1.93157958984375, -1.7318115234375, -1.53204345703125, -1.332275390625, -1.13250732421875, -0.9327392578125, -0.73297119140625, -0.533203125, -0.33343505859375, -0.1336669921875, 0.06610107421875, 0.265869140625, 0.46563720703125, 0.6654052734375, 0.86517333984375, 1.06494140625, 1.26470947265625, 1.4644775390625, 1.66424560546875, 1.864013671875, 2.06378173828125, 2.2635498046875, 2.46331787109375, 2.6630859375, 2.86285400390625, 3.0626220703125, 3.26239013671875, 3.462158203125, 3.66192626953125, 3.8616943359375, 4.06146240234375, 4.26123046875, 4.46099853515625, 4.6607666015625, 4.86053466796875, 5.060302734375, 5.26007080078125, 5.4598388671875, 5.65960693359375, 5.859375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 7.0, 4.0, 6.0, 13.0, 10.0, 11.0, 18.0, 24.0, 28.0, 28.0, 39.0, 40.0, 69.0, 43.0, 66.0, 124.0, 1648.0, 383.0, 115.0, 55.0, 52.0, 63.0, 45.0, 28.0, 31.0, 21.0, 18.0, 11.0, 16.0, 11.0, 11.0, 11.0, 0.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.703125, -28.82666015625, -27.9501953125, -27.07373046875, -26.197265625, -25.32080078125, -24.4443359375, -23.56787109375, -22.69140625, -21.81494140625, -20.9384765625, -20.06201171875, -19.185546875, -18.30908203125, -17.4326171875, -16.55615234375, -15.6796875, -14.80322265625, -13.9267578125, -13.05029296875, -12.173828125, -11.29736328125, -10.4208984375, -9.54443359375, -8.66796875, -7.79150390625, -6.9150390625, -6.03857421875, -5.162109375, -4.28564453125, -3.4091796875, -2.53271484375, -1.65625, -0.77978515625, 0.0966796875, 0.97314453125, 1.849609375, 2.72607421875, 3.6025390625, 4.47900390625, 5.35546875, 6.23193359375, 7.1083984375, 7.98486328125, 8.861328125, 9.73779296875, 10.6142578125, 11.49072265625, 12.3671875, 13.24365234375, 14.1201171875, 14.99658203125, 15.873046875, 16.74951171875, 17.6259765625, 18.50244140625, 19.37890625, 20.25537109375, 21.1318359375, 22.00830078125, 22.884765625, 23.76123046875, 24.6376953125, 25.51416015625, 26.390625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 5.0, 7.0, 9.0, 7.0, 19.0, 21.0, 22.0, 25.0, 42.0, 57.0, 76.0, 94.0, 151.0, 225.0, 438.0, 1022.0, 15095.0, 3112747.0, 13478.0, 968.0, 396.0, 263.0, 158.0, 101.0, 65.0, 48.0, 48.0, 28.0, 23.0, 24.0, 9.0, 7.0, 8.0, 3.0, 10.0, 4.0, 2.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-63.4375, -61.4228515625, -59.408203125, -57.3935546875, -55.37890625, -53.3642578125, -51.349609375, -49.3349609375, -47.3203125, -45.3056640625, -43.291015625, -41.2763671875, -39.26171875, -37.2470703125, -35.232421875, -33.2177734375, -31.203125, -29.1884765625, -27.173828125, -25.1591796875, -23.14453125, -21.1298828125, -19.115234375, -17.1005859375, -15.0859375, -13.0712890625, -11.056640625, -9.0419921875, -7.02734375, -5.0126953125, -2.998046875, -0.9833984375, 1.03125, 3.0458984375, 5.060546875, 7.0751953125, 9.08984375, 11.1044921875, 13.119140625, 15.1337890625, 17.1484375, 19.1630859375, 21.177734375, 23.1923828125, 25.20703125, 27.2216796875, 29.236328125, 31.2509765625, 33.265625, 35.2802734375, 37.294921875, 39.3095703125, 41.32421875, 43.3388671875, 45.353515625, 47.3681640625, 49.3828125, 51.3974609375, 53.412109375, 55.4267578125, 57.44140625, 59.4560546875, 61.470703125, 63.4853515625, 65.5]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 16.0, 61.0, 150.0, 277.0, 268.0, 154.0, 64.0, 11.0, 5.0, 1.0, 0.0, 1.0], "bins": [-83.46466064453125, -81.97505950927734, -80.48545837402344, -78.99585723876953, -77.50625610351562, -76.01665496826172, -74.52705383300781, -73.03746032714844, -71.54785919189453, -70.05825805664062, -68.56865692138672, -67.07905578613281, -65.5894546508789, -64.099853515625, -62.61025619506836, -61.12065505981445, -59.63105010986328, -58.141448974609375, -56.65184783935547, -55.16224670410156, -53.67264938354492, -52.183048248291016, -50.69344711303711, -49.2038459777832, -47.71424865722656, -46.224647521972656, -44.73504638671875, -43.245445251464844, -41.7558479309082, -40.2662467956543, -38.77664566040039, -37.287044525146484, -35.79744338989258, -34.30784225463867, -32.818241119384766, -31.328641891479492, -29.839040756225586, -28.349441528320312, -26.859840393066406, -25.3702392578125, -23.880640029907227, -22.39103889465332, -20.901439666748047, -19.41183853149414, -17.922237396240234, -16.432636260986328, -14.943037033081055, -13.453435897827148, -11.963835716247559, -10.474235534667969, -8.984634399414062, -7.495034217834473, -6.005433559417725, -4.515832901000977, -3.0262327194213867, -1.5366315841674805, -0.047031402587890625, 1.4425691366195679, 2.9321696758270264, 4.421770095825195, 5.911370754241943, 7.400971412658691, 8.890571594238281, 10.380172729492188, 11.869772911071777]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 5.0, 7.0, 8.0, 11.0, 10.0, 12.0, 10.0, 18.0, 22.0, 13.0, 24.0, 31.0, 27.0, 28.0, 34.0, 25.0, 41.0, 43.0, 34.0, 48.0, 36.0, 35.0, 43.0, 38.0, 48.0, 48.0, 37.0, 28.0, 35.0, 26.0, 29.0, 20.0, 28.0, 17.0, 19.0, 20.0, 11.0, 3.0, 9.0, 5.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-62.3173828125, -60.645992279052734, -58.97460174560547, -57.30321502685547, -55.6318244934082, -53.96043395996094, -52.28904342651367, -50.617652893066406, -48.94626235961914, -47.274871826171875, -45.60348129272461, -43.932090759277344, -42.260704040527344, -40.58931350708008, -38.91792297363281, -37.24653244018555, -35.57514190673828, -33.903751373291016, -32.23236083984375, -30.560972213745117, -28.88958168029785, -27.21819305419922, -25.546802520751953, -23.875411987304688, -22.204025268554688, -20.532634735107422, -18.86124610900879, -17.189855575561523, -15.518465042114258, -13.847075462341309, -12.17568588256836, -10.504295349121094, -8.832904815673828, -7.161514759063721, -5.490124702453613, -3.818735122680664, -2.1473450660705566, -0.4759550094604492, 1.1954345703125, 2.8668251037597656, 4.538214683532715, 6.209604740142822, 7.88099479675293, 9.552384376525879, 11.223773956298828, 12.895164489746094, 14.566554069519043, 16.237945556640625, 17.909334182739258, 19.580724716186523, 21.252113342285156, 22.923503875732422, 24.594894409179688, 26.266284942626953, 27.937673568725586, 29.60906410217285, 31.280452728271484, 32.95184326171875, 34.623233795166016, 36.29462432861328, 37.96601104736328, 39.63740158081055, 41.30879211425781, 42.98018264770508, 44.651573181152344]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 4.0, 5.0, 7.0, 4.0, 4.0, 6.0, 10.0, 5.0, 11.0, 9.0, 13.0, 15.0, 22.0, 15.0, 15.0, 22.0, 30.0, 32.0, 29.0, 28.0, 26.0, 34.0, 37.0, 37.0, 47.0, 55.0, 52.0, 44.0, 38.0, 35.0, 45.0, 36.0, 37.0, 22.0, 17.0, 27.0, 19.0, 24.0, 19.0, 12.0, 5.0, 11.0, 6.0, 12.0, 6.0, 7.0, 2.0, 3.0, 5.0, 2.0, 3.0, 0.0, 4.0], "bins": [-7.7109375, -7.4979248046875, -7.284912109375, -7.0718994140625, -6.85888671875, -6.6458740234375, -6.432861328125, -6.2198486328125, -6.0068359375, -5.7938232421875, -5.580810546875, -5.3677978515625, -5.15478515625, -4.9417724609375, -4.728759765625, -4.5157470703125, -4.302734375, -4.0897216796875, -3.876708984375, -3.6636962890625, -3.45068359375, -3.2376708984375, -3.024658203125, -2.8116455078125, -2.5986328125, -2.3856201171875, -2.172607421875, -1.9595947265625, -1.74658203125, -1.5335693359375, -1.320556640625, -1.1075439453125, -0.89453125, -0.6815185546875, -0.468505859375, -0.2554931640625, -0.04248046875, 0.1705322265625, 0.383544921875, 0.5965576171875, 0.8095703125, 1.0225830078125, 1.235595703125, 1.4486083984375, 1.66162109375, 1.8746337890625, 2.087646484375, 2.3006591796875, 2.513671875, 2.7266845703125, 2.939697265625, 3.1527099609375, 3.36572265625, 3.5787353515625, 3.791748046875, 4.0047607421875, 4.2177734375, 4.4307861328125, 4.643798828125, 4.8568115234375, 5.06982421875, 5.2828369140625, 5.495849609375, 5.7088623046875, 5.921875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 4.0, 2.0, 2.0, 7.0, 8.0, 10.0, 11.0, 6.0, 9.0, 12.0, 21.0, 31.0, 22.0, 46.0, 48.0, 40.0, 49.0, 106.0, 153.0, 253.0, 474.0, 1362.0, 6861.0, 122801.0, 2996522.0, 1034420.0, 26184.0, 2949.0, 805.0, 351.0, 195.0, 142.0, 69.0, 72.0, 51.0, 27.0, 26.0, 23.0, 24.0, 19.0, 12.0, 14.0, 6.0, 9.0, 7.0, 6.0, 2.0, 5.0, 3.0, 4.0, 0.0, 3.0, 1.0], "bins": [-24.828125, -24.134033203125, -23.43994140625, -22.745849609375, -22.0517578125, -21.357666015625, -20.66357421875, -19.969482421875, -19.275390625, -18.581298828125, -17.88720703125, -17.193115234375, -16.4990234375, -15.804931640625, -15.11083984375, -14.416748046875, -13.72265625, -13.028564453125, -12.33447265625, -11.640380859375, -10.9462890625, -10.252197265625, -9.55810546875, -8.864013671875, -8.169921875, -7.475830078125, -6.78173828125, -6.087646484375, -5.3935546875, -4.699462890625, -4.00537109375, -3.311279296875, -2.6171875, -1.923095703125, -1.22900390625, -0.534912109375, 0.1591796875, 0.853271484375, 1.54736328125, 2.241455078125, 2.935546875, 3.629638671875, 4.32373046875, 5.017822265625, 5.7119140625, 6.406005859375, 7.10009765625, 7.794189453125, 8.48828125, 9.182373046875, 9.87646484375, 10.570556640625, 11.2646484375, 11.958740234375, 12.65283203125, 13.346923828125, 14.041015625, 14.735107421875, 15.42919921875, 16.123291015625, 16.8173828125, 17.511474609375, 18.20556640625, 18.899658203125, 19.59375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 3.0, 6.0, 14.0, 15.0, 27.0, 30.0, 52.0, 58.0, 102.0, 153.0, 243.0, 333.0, 514.0, 566.0, 556.0, 432.0, 319.0, 196.0, 148.0, 102.0, 71.0, 46.0, 36.0, 24.0, 15.0, 10.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-20.625, -20.1441650390625, -19.663330078125, -19.1824951171875, -18.70166015625, -18.2208251953125, -17.739990234375, -17.2591552734375, -16.7783203125, -16.2974853515625, -15.816650390625, -15.3358154296875, -14.85498046875, -14.3741455078125, -13.893310546875, -13.4124755859375, -12.931640625, -12.4508056640625, -11.969970703125, -11.4891357421875, -11.00830078125, -10.5274658203125, -10.046630859375, -9.5657958984375, -9.0849609375, -8.6041259765625, -8.123291015625, -7.6424560546875, -7.16162109375, -6.6807861328125, -6.199951171875, -5.7191162109375, -5.23828125, -4.7574462890625, -4.276611328125, -3.7957763671875, -3.31494140625, -2.8341064453125, -2.353271484375, -1.8724365234375, -1.3916015625, -0.9107666015625, -0.429931640625, 0.0509033203125, 0.53173828125, 1.0125732421875, 1.493408203125, 1.9742431640625, 2.455078125, 2.9359130859375, 3.416748046875, 3.8975830078125, 4.37841796875, 4.8592529296875, 5.340087890625, 5.8209228515625, 6.3017578125, 6.7825927734375, 7.263427734375, 7.7442626953125, 8.22509765625, 8.7059326171875, 9.186767578125, 9.6676025390625, 10.1484375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 9.0, 14.0, 22.0, 24.0, 42.0, 60.0, 64.0, 107.0, 128.0, 199.0, 223.0, 350.0, 585.0, 2353.0, 953768.0, 3230447.0, 3913.0, 662.0, 399.0, 238.0, 200.0, 130.0, 82.0, 75.0, 58.0, 40.0, 39.0, 19.0, 5.0, 5.0, 9.0, 4.0, 1.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.0, -49.7470703125, -47.494140625, -45.2412109375, -42.98828125, -40.7353515625, -38.482421875, -36.2294921875, -33.9765625, -31.7236328125, -29.470703125, -27.2177734375, -24.96484375, -22.7119140625, -20.458984375, -18.2060546875, -15.953125, -13.7001953125, -11.447265625, -9.1943359375, -6.94140625, -4.6884765625, -2.435546875, -0.1826171875, 2.0703125, 4.3232421875, 6.576171875, 8.8291015625, 11.08203125, 13.3349609375, 15.587890625, 17.8408203125, 20.09375, 22.3466796875, 24.599609375, 26.8525390625, 29.10546875, 31.3583984375, 33.611328125, 35.8642578125, 38.1171875, 40.3701171875, 42.623046875, 44.8759765625, 47.12890625, 49.3818359375, 51.634765625, 53.8876953125, 56.140625, 58.3935546875, 60.646484375, 62.8994140625, 65.15234375, 67.4052734375, 69.658203125, 71.9111328125, 74.1640625, 76.4169921875, 78.669921875, 80.9228515625, 83.17578125, 85.4287109375, 87.681640625, 89.9345703125, 92.1875]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 22.0, 106.0, 291.0, 358.0, 180.0, 45.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.2844696044922, -231.57984924316406, -226.875244140625, -222.17062377929688, -217.46600341796875, -212.76138305664062, -208.0567626953125, -203.35215759277344, -198.6475372314453, -193.9429168701172, -189.23831176757812, -184.53369140625, -179.82907104492188, -175.12445068359375, -170.41983032226562, -165.71522521972656, -161.01060485839844, -156.3059844970703, -151.60137939453125, -146.89675903320312, -142.192138671875, -137.48751831054688, -132.78289794921875, -128.0782928466797, -123.37367248535156, -118.66905212402344, -113.96443939208984, -109.25982666015625, -104.55520629882812, -99.8505859375, -95.1459732055664, -90.44136047363281, -85.73675537109375, -81.03213500976562, -76.32752227783203, -71.62290954589844, -66.91828918457031, -62.21367263793945, -57.509056091308594, -52.804439544677734, -48.099822998046875, -43.395206451416016, -38.690589904785156, -33.9859733581543, -29.281356811523438, -24.576740264892578, -19.87212371826172, -15.16750717163086, -10.462890625, -5.758274078369141, -1.0536575317382812, 3.650959014892578, 8.355575561523438, 13.060192108154297, 17.764808654785156, 22.469425201416016, 27.174041748046875, 31.878658294677734, 36.583274841308594, 41.28789138793945, 45.99250793457031, 50.69712448120117, 55.40174102783203, 60.10635757446289, 64.81097412109375]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 4.0, 4.0, 4.0, 4.0, 4.0, 11.0, 13.0, 9.0, 14.0, 25.0, 24.0, 23.0, 27.0, 21.0, 30.0, 32.0, 30.0, 39.0, 26.0, 35.0, 42.0, 44.0, 28.0, 48.0, 41.0, 25.0, 35.0, 35.0, 33.0, 43.0, 34.0, 32.0, 18.0, 28.0, 25.0, 25.0, 15.0, 17.0, 11.0, 6.0, 12.0, 7.0, 7.0, 6.0, 1.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-37.430511474609375, -36.22124099731445, -35.0119743347168, -33.802703857421875, -32.59343338012695, -31.384164810180664, -30.174896240234375, -28.965625762939453, -27.75635528564453, -26.547086715698242, -25.33781623840332, -24.12854766845703, -22.91927719116211, -21.71000862121582, -20.50074005126953, -19.29146957397461, -18.08220100402832, -16.87293243408203, -15.66366195678711, -14.45439338684082, -13.245122909545898, -12.03585433959961, -10.826584815979004, -9.617315292358398, -8.408045768737793, -7.1987762451171875, -5.989506721496582, -4.780237674713135, -3.5709681510925293, -2.361698627471924, -1.1524295806884766, 0.056839942932128906, 1.2661094665527344, 2.47537899017334, 3.684648275375366, 4.893917560577393, 6.103187084197998, 7.3124566078186035, 8.52172565460205, 9.730995178222656, 10.940264701843262, 12.149534225463867, 13.358803749084473, 14.568073272705078, 15.777341842651367, 16.98661231994629, 18.195880889892578, 19.4051513671875, 20.61441993713379, 21.823688507080078, 23.032958984375, 24.24222755432129, 25.45149803161621, 26.6607666015625, 27.870037078857422, 29.07930564880371, 30.28857421875, 31.49784278869629, 32.70711135864258, 33.9163818359375, 35.12565231323242, 36.334922790527344, 37.544189453125, 38.75345993041992, 39.962730407714844]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 6.0, 3.0, 9.0, 7.0, 11.0, 13.0, 8.0, 18.0, 9.0, 20.0, 14.0, 21.0, 21.0, 29.0, 22.0, 34.0, 24.0, 27.0, 33.0, 30.0, 34.0, 54.0, 32.0, 44.0, 51.0, 43.0, 32.0, 38.0, 30.0, 40.0, 19.0, 27.0, 24.0, 31.0, 22.0, 18.0, 19.0, 11.0, 16.0, 9.0, 13.0, 5.0, 6.0, 4.0, 6.0, 2.0, 4.0, 3.0, 4.0, 2.0, 1.0], "bins": [-7.25390625, -7.05108642578125, -6.8482666015625, -6.64544677734375, -6.442626953125, -6.23980712890625, -6.0369873046875, -5.83416748046875, -5.63134765625, -5.42852783203125, -5.2257080078125, -5.02288818359375, -4.820068359375, -4.61724853515625, -4.4144287109375, -4.21160888671875, -4.0087890625, -3.80596923828125, -3.6031494140625, -3.40032958984375, -3.197509765625, -2.99468994140625, -2.7918701171875, -2.58905029296875, -2.38623046875, -2.18341064453125, -1.9805908203125, -1.77777099609375, -1.574951171875, -1.37213134765625, -1.1693115234375, -0.96649169921875, -0.763671875, -0.56085205078125, -0.3580322265625, -0.15521240234375, 0.047607421875, 0.25042724609375, 0.4532470703125, 0.65606689453125, 0.85888671875, 1.06170654296875, 1.2645263671875, 1.46734619140625, 1.670166015625, 1.87298583984375, 2.0758056640625, 2.27862548828125, 2.4814453125, 2.68426513671875, 2.8870849609375, 3.08990478515625, 3.292724609375, 3.49554443359375, 3.6983642578125, 3.90118408203125, 4.10400390625, 4.30682373046875, 4.5096435546875, 4.71246337890625, 4.915283203125, 5.11810302734375, 5.3209228515625, 5.52374267578125, 5.7265625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 18.0, 16.0, 23.0, 40.0, 46.0, 92.0, 139.0, 208.0, 290.0, 412.0, 639.0, 892.0, 1261.0, 1860.0, 2713.0, 3886.0, 5862.0, 8830.0, 13484.0, 19979.0, 32015.0, 51522.0, 85472.0, 138261.0, 190852.0, 176218.0, 118043.0, 71942.0, 43937.0, 27087.0, 17426.0, 11271.0, 7647.0, 5136.0, 3493.0, 2324.0, 1636.0, 1133.0, 763.0, 555.0, 349.0, 247.0, 195.0, 119.0, 76.0, 51.0, 34.0, 22.0, 19.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.69287109375, -0.6703948974609375, -0.647918701171875, -0.6254425048828125, -0.60296630859375, -0.5804901123046875, -0.558013916015625, -0.5355377197265625, -0.5130615234375, -0.4905853271484375, -0.468109130859375, -0.4456329345703125, -0.42315673828125, -0.4006805419921875, -0.378204345703125, -0.3557281494140625, -0.333251953125, -0.3107757568359375, -0.288299560546875, -0.2658233642578125, -0.24334716796875, -0.2208709716796875, -0.198394775390625, -0.1759185791015625, -0.1534423828125, -0.1309661865234375, -0.108489990234375, -0.0860137939453125, -0.06353759765625, -0.0410614013671875, -0.018585205078125, 0.0038909912109375, 0.0263671875, 0.0488433837890625, 0.071319580078125, 0.0937957763671875, 0.11627197265625, 0.1387481689453125, 0.161224365234375, 0.1837005615234375, 0.2061767578125, 0.2286529541015625, 0.251129150390625, 0.2736053466796875, 0.29608154296875, 0.3185577392578125, 0.341033935546875, 0.3635101318359375, 0.385986328125, 0.4084625244140625, 0.430938720703125, 0.4534149169921875, 0.47589111328125, 0.4983673095703125, 0.520843505859375, 0.5433197021484375, 0.5657958984375, 0.5882720947265625, 0.610748291015625, 0.6332244873046875, 0.65570068359375, 0.6781768798828125, 0.700653076171875, 0.7231292724609375, 0.74560546875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 7.0, 1.0, 9.0, 9.0, 10.0, 9.0, 16.0, 13.0, 22.0, 34.0, 23.0, 20.0, 33.0, 32.0, 34.0, 40.0, 38.0, 34.0, 42.0, 40.0, 44.0, 1062.0, 45.0, 40.0, 30.0, 42.0, 35.0, 36.0, 27.0, 19.0, 28.0, 10.0, 25.0, 29.0, 17.0, 18.0, 9.0, 10.0, 8.0, 7.0, 4.0, 4.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.46484375, -4.32696533203125, -4.1890869140625, -4.05120849609375, -3.913330078125, -3.77545166015625, -3.6375732421875, -3.49969482421875, -3.36181640625, -3.22393798828125, -3.0860595703125, -2.94818115234375, -2.810302734375, -2.67242431640625, -2.5345458984375, -2.39666748046875, -2.2587890625, -2.12091064453125, -1.9830322265625, -1.84515380859375, -1.707275390625, -1.56939697265625, -1.4315185546875, -1.29364013671875, -1.15576171875, -1.01788330078125, -0.8800048828125, -0.74212646484375, -0.604248046875, -0.46636962890625, -0.3284912109375, -0.19061279296875, -0.052734375, 0.08514404296875, 0.2230224609375, 0.36090087890625, 0.498779296875, 0.63665771484375, 0.7745361328125, 0.91241455078125, 1.05029296875, 1.18817138671875, 1.3260498046875, 1.46392822265625, 1.601806640625, 1.73968505859375, 1.8775634765625, 2.01544189453125, 2.1533203125, 2.29119873046875, 2.4290771484375, 2.56695556640625, 2.704833984375, 2.84271240234375, 2.9805908203125, 3.11846923828125, 3.25634765625, 3.39422607421875, 3.5321044921875, 3.66998291015625, 3.807861328125, 3.94573974609375, 4.0836181640625, 4.22149658203125, 4.359375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 9.0, 10.0, 21.0, 26.0, 45.0, 69.0, 95.0, 157.0, 272.0, 439.0, 743.0, 1216.0, 2011.0, 3443.0, 5758.0, 9881.0, 17791.0, 31705.0, 59500.0, 116935.0, 212593.0, 1297193.0, 158630.0, 81826.0, 42537.0, 23153.0, 12822.0, 7354.0, 4372.0, 2595.0, 1558.0, 902.0, 606.0, 319.0, 210.0, 137.0, 62.0, 56.0, 24.0, 19.0, 12.0, 8.0, 9.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75, -0.7234344482421875, -0.696868896484375, -0.6703033447265625, -0.64373779296875, -0.6171722412109375, -0.590606689453125, -0.5640411376953125, -0.5374755859375, -0.5109100341796875, -0.484344482421875, -0.4577789306640625, -0.43121337890625, -0.4046478271484375, -0.378082275390625, -0.3515167236328125, -0.324951171875, -0.2983856201171875, -0.271820068359375, -0.2452545166015625, -0.21868896484375, -0.1921234130859375, -0.165557861328125, -0.1389923095703125, -0.1124267578125, -0.0858612060546875, -0.059295654296875, -0.0327301025390625, -0.00616455078125, 0.0204010009765625, 0.046966552734375, 0.0735321044921875, 0.10009765625, 0.1266632080078125, 0.153228759765625, 0.1797943115234375, 0.20635986328125, 0.2329254150390625, 0.259490966796875, 0.2860565185546875, 0.3126220703125, 0.3391876220703125, 0.365753173828125, 0.3923187255859375, 0.41888427734375, 0.4454498291015625, 0.472015380859375, 0.4985809326171875, 0.525146484375, 0.5517120361328125, 0.578277587890625, 0.6048431396484375, 0.63140869140625, 0.6579742431640625, 0.684539794921875, 0.7111053466796875, 0.7376708984375, 0.7642364501953125, 0.790802001953125, 0.8173675537109375, 0.84393310546875, 0.8704986572265625, 0.897064208984375, 0.9236297607421875, 0.9501953125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 4.0, 1.0, 3.0, 2.0, 10.0, 8.0, 7.0, 23.0, 10.0, 17.0, 17.0, 33.0, 32.0, 40.0, 34.0, 42.0, 34.0, 43.0, 46.0, 37.0, 52.0, 53.0, 39.0, 43.0, 43.0, 28.0, 35.0, 32.0, 37.0, 19.0, 24.0, 25.0, 30.0, 19.0, 17.0, 15.0, 15.0, 10.0, 6.0, 6.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00170135498046875, -0.001648634672164917, -0.001595914363861084, -0.001543194055557251, -0.001490473747253418, -0.001437753438949585, -0.001385033130645752, -0.001332312822341919, -0.001279592514038086, -0.001226872205734253, -0.00117415189743042, -0.001121431589126587, -0.001068711280822754, -0.001015990972518921, -0.0009632706642150879, -0.0009105503559112549, -0.0008578300476074219, -0.0008051097393035889, -0.0007523894309997559, -0.0006996691226959229, -0.0006469488143920898, -0.0005942285060882568, -0.0005415081977844238, -0.0004887878894805908, -0.0004360675811767578, -0.0003833472728729248, -0.0003306269645690918, -0.0002779066562652588, -0.00022518634796142578, -0.00017246603965759277, -0.00011974573135375977, -6.702542304992676e-05, -1.430511474609375e-05, 3.841519355773926e-05, 9.113550186157227e-05, 0.00014385581016540527, 0.00019657611846923828, 0.0002492964267730713, 0.0003020167350769043, 0.0003547370433807373, 0.0004074573516845703, 0.0004601776599884033, 0.0005128979682922363, 0.0005656182765960693, 0.0006183385848999023, 0.0006710588932037354, 0.0007237792015075684, 0.0007764995098114014, 0.0008292198181152344, 0.0008819401264190674, 0.0009346604347229004, 0.0009873807430267334, 0.0010401010513305664, 0.0010928213596343994, 0.0011455416679382324, 0.0011982619762420654, 0.0012509822845458984, 0.0013037025928497314, 0.0013564229011535645, 0.0014091432094573975, 0.0014618635177612305, 0.0015145838260650635, 0.0015673041343688965, 0.0016200244426727295, 0.0016727447509765625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 5.0, 7.0, 13.0, 17.0, 13.0, 28.0, 26.0, 32.0, 50.0, 50.0, 63.0, 68.0, 89.0, 151.0, 266.0, 631.0, 2617.0, 1005290.0, 37150.0, 911.0, 378.0, 154.0, 134.0, 82.0, 59.0, 55.0, 59.0, 31.0, 30.0, 16.0, 17.0, 13.0, 10.0, 10.0, 4.0, 6.0, 8.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0413818359375, -0.040116310119628906, -0.03885078430175781, -0.03758525848388672, -0.036319732666015625, -0.03505420684814453, -0.03378868103027344, -0.032523155212402344, -0.03125762939453125, -0.029992103576660156, -0.028726577758789062, -0.02746105194091797, -0.026195526123046875, -0.02493000030517578, -0.023664474487304688, -0.022398948669433594, -0.0211334228515625, -0.019867897033691406, -0.018602371215820312, -0.01733684539794922, -0.016071319580078125, -0.014805793762207031, -0.013540267944335938, -0.012274742126464844, -0.01100921630859375, -0.009743690490722656, -0.008478164672851562, -0.007212638854980469, -0.005947113037109375, -0.004681587219238281, -0.0034160614013671875, -0.0021505355834960938, -0.000885009765625, 0.00038051605224609375, 0.0016460418701171875, 0.0029115676879882812, 0.004177093505859375, 0.005442619323730469, 0.0067081451416015625, 0.007973670959472656, 0.00923919677734375, 0.010504722595214844, 0.011770248413085938, 0.013035774230957031, 0.014301300048828125, 0.015566825866699219, 0.016832351684570312, 0.018097877502441406, 0.0193634033203125, 0.020628929138183594, 0.021894454956054688, 0.02315998077392578, 0.024425506591796875, 0.02569103240966797, 0.026956558227539062, 0.028222084045410156, 0.02948760986328125, 0.030753135681152344, 0.03201866149902344, 0.03328418731689453, 0.034549713134765625, 0.03581523895263672, 0.03708076477050781, 0.038346290588378906, 0.03961181640625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 23.0, 429.0, 523.0, 42.0, 4.0], "bins": [-0.016269750893115997, -0.016003305092453957, -0.015736859291791916, -0.015470413491129875, -0.015203967690467834, -0.014937521889805794, -0.014671076089143753, -0.014404630288481712, -0.014138184487819672, -0.013871738687157631, -0.01360529288649559, -0.01333884708583355, -0.013072401285171509, -0.012805955484509468, -0.012539509683847427, -0.012273063883185387, -0.012006618082523346, -0.011740172281861305, -0.011473726481199265, -0.011207280680537224, -0.010940834879875183, -0.010674389079213142, -0.010407943278551102, -0.010141497477889061, -0.009875052608549595, -0.009608606807887554, -0.009342161007225513, -0.009075715206563473, -0.008809269405901432, -0.008542823605239391, -0.00827637780457735, -0.00800993200391531, -0.007743487134575844, -0.007477041333913803, -0.007210595533251762, -0.006944149732589722, -0.006677703931927681, -0.00641125813126564, -0.0061448123306035995, -0.005878366529941559, -0.005611920729279518, -0.005345474928617477, -0.005079029127955437, -0.004812583327293396, -0.004546137526631355, -0.004279691725969315, -0.004013245925307274, -0.003746800357475877, -0.0034803547896444798, -0.003213908988982439, -0.0029474631883203983, -0.0026810173876583576, -0.002414571586996317, -0.002148125786334276, -0.0018816802185028791, -0.0016152344178408384, -0.001348788500763476, -0.0010823427001014352, -0.0008158969576470554, -0.0005494512151926756, -0.0002830054145306349, -1.655961386859417e-05, 0.0002498860703781247, 0.0005163318710401654, 0.0007827776717022061]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 12.0, 13.0, 12.0, 14.0, 14.0, 19.0, 21.0, 21.0, 32.0, 28.0, 26.0, 36.0, 21.0, 40.0, 39.0, 50.0, 43.0, 30.0, 38.0, 43.0, 43.0, 46.0, 34.0, 38.0, 54.0, 31.0, 29.0, 30.0, 21.0, 18.0, 18.0, 18.0, 12.0, 14.0, 7.0, 9.0, 3.0, 10.0, 9.0, 5.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000904381275177002, -0.000872359611093998, -0.000840337947010994, -0.00080831628292799, -0.000776294618844986, -0.000744272954761982, -0.000712251290678978, -0.000680229626595974, -0.00064820796251297, -0.000616186298429966, -0.000584164634346962, -0.000552142970263958, -0.000520121306180954, -0.00048809964209795, -0.000456077978014946, -0.000424056313931942, -0.000392034649848938, -0.000360012985765934, -0.00032799132168293, -0.000295969657599926, -0.000263947993516922, -0.000231926329433918, -0.000199904665350914, -0.00016788300126791, -0.000135861337184906, -0.00010383967310190201, -7.181800901889801e-05, -3.979634493589401e-05, -7.774680852890015e-06, 2.4246983230113983e-05, 5.626864731311798e-05, 8.829031139612198e-05, 0.00012031197547912598, 0.00015233363956212997, 0.00018435530364513397, 0.00021637696772813797, 0.00024839863181114197, 0.00028042029589414597, 0.00031244195997714996, 0.00034446362406015396, 0.00037648528814315796, 0.00040850695222616196, 0.00044052861630916595, 0.00047255028039216995, 0.000504571944475174, 0.000536593608558178, 0.000568615272641182, 0.0006006369367241859, 0.0006326586008071899, 0.0006646802648901939, 0.0006967019289731979, 0.0007287235930562019, 0.0007607452571392059, 0.0007927669212222099, 0.0008247885853052139, 0.0008568102493882179, 0.0008888319134712219, 0.0009208535775542259, 0.0009528752416372299, 0.000984896905720234, 0.001016918569803238, 0.001048940233886242, 0.001080961897969246, 0.00111298356205225, 0.001145005226135254]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 6.0, 3.0, 9.0, 7.0, 11.0, 13.0, 8.0, 18.0, 9.0, 20.0, 14.0, 21.0, 21.0, 29.0, 22.0, 34.0, 24.0, 27.0, 33.0, 30.0, 34.0, 54.0, 31.0, 45.0, 51.0, 43.0, 31.0, 39.0, 30.0, 40.0, 19.0, 27.0, 24.0, 31.0, 22.0, 18.0, 19.0, 11.0, 16.0, 9.0, 13.0, 5.0, 6.0, 4.0, 6.0, 2.0, 4.0, 3.0, 4.0, 2.0, 1.0], "bins": [-7.25390625, -7.05108642578125, -6.8482666015625, -6.64544677734375, -6.442626953125, -6.23980712890625, -6.0369873046875, -5.83416748046875, -5.63134765625, -5.42852783203125, -5.2257080078125, -5.02288818359375, -4.820068359375, -4.61724853515625, -4.4144287109375, -4.21160888671875, -4.0087890625, -3.80596923828125, -3.6031494140625, -3.40032958984375, -3.197509765625, -2.99468994140625, -2.7918701171875, -2.58905029296875, -2.38623046875, -2.18341064453125, -1.9805908203125, -1.77777099609375, -1.574951171875, -1.37213134765625, -1.1693115234375, -0.96649169921875, -0.763671875, -0.56085205078125, -0.3580322265625, -0.15521240234375, 0.047607421875, 0.25042724609375, 0.4532470703125, 0.65606689453125, 0.85888671875, 1.06170654296875, 1.2645263671875, 1.46734619140625, 1.670166015625, 1.87298583984375, 2.0758056640625, 2.27862548828125, 2.4814453125, 2.68426513671875, 2.8870849609375, 3.08990478515625, 3.292724609375, 3.49554443359375, 3.6983642578125, 3.90118408203125, 4.10400390625, 4.30682373046875, 4.5096435546875, 4.71246337890625, 4.915283203125, 5.11810302734375, 5.3209228515625, 5.52374267578125, 5.7265625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 5.0, 6.0, 3.0, 8.0, 11.0, 18.0, 17.0, 17.0, 31.0, 20.0, 39.0, 49.0, 65.0, 86.0, 138.0, 163.0, 288.0, 550.0, 828.0, 1801.0, 4558.0, 16828.0, 85367.0, 672959.0, 217089.0, 34032.0, 7896.0, 2633.0, 1172.0, 647.0, 400.0, 235.0, 144.0, 100.0, 84.0, 70.0, 41.0, 30.0, 29.0, 28.0, 17.0, 16.0, 8.0, 7.0, 3.0, 6.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0], "bins": [-13.359375, -12.9854736328125, -12.611572265625, -12.2376708984375, -11.86376953125, -11.4898681640625, -11.115966796875, -10.7420654296875, -10.3681640625, -9.9942626953125, -9.620361328125, -9.2464599609375, -8.87255859375, -8.4986572265625, -8.124755859375, -7.7508544921875, -7.376953125, -7.0030517578125, -6.629150390625, -6.2552490234375, -5.88134765625, -5.5074462890625, -5.133544921875, -4.7596435546875, -4.3857421875, -4.0118408203125, -3.637939453125, -3.2640380859375, -2.89013671875, -2.5162353515625, -2.142333984375, -1.7684326171875, -1.39453125, -1.0206298828125, -0.646728515625, -0.2728271484375, 0.10107421875, 0.4749755859375, 0.848876953125, 1.2227783203125, 1.5966796875, 1.9705810546875, 2.344482421875, 2.7183837890625, 3.09228515625, 3.4661865234375, 3.840087890625, 4.2139892578125, 4.587890625, 4.9617919921875, 5.335693359375, 5.7095947265625, 6.08349609375, 6.4573974609375, 6.831298828125, 7.2052001953125, 7.5791015625, 7.9530029296875, 8.326904296875, 8.7008056640625, 9.07470703125, 9.4486083984375, 9.822509765625, 10.1964111328125, 10.5703125]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 3.0, 6.0, 6.0, 7.0, 12.0, 16.0, 23.0, 36.0, 29.0, 26.0, 49.0, 52.0, 58.0, 62.0, 90.0, 390.0, 1674.0, 90.0, 71.0, 46.0, 53.0, 51.0, 37.0, 38.0, 30.0, 19.0, 20.0, 12.0, 12.0, 11.0, 3.0, 4.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.09375, -27.12646484375, -26.1591796875, -25.19189453125, -24.224609375, -23.25732421875, -22.2900390625, -21.32275390625, -20.35546875, -19.38818359375, -18.4208984375, -17.45361328125, -16.486328125, -15.51904296875, -14.5517578125, -13.58447265625, -12.6171875, -11.64990234375, -10.6826171875, -9.71533203125, -8.748046875, -7.78076171875, -6.8134765625, -5.84619140625, -4.87890625, -3.91162109375, -2.9443359375, -1.97705078125, -1.009765625, -0.04248046875, 0.9248046875, 1.89208984375, 2.859375, 3.82666015625, 4.7939453125, 5.76123046875, 6.728515625, 7.69580078125, 8.6630859375, 9.63037109375, 10.59765625, 11.56494140625, 12.5322265625, 13.49951171875, 14.466796875, 15.43408203125, 16.4013671875, 17.36865234375, 18.3359375, 19.30322265625, 20.2705078125, 21.23779296875, 22.205078125, 23.17236328125, 24.1396484375, 25.10693359375, 26.07421875, 27.04150390625, 28.0087890625, 28.97607421875, 29.943359375, 30.91064453125, 31.8779296875, 32.84521484375, 33.8125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 8.0, 4.0, 5.0, 7.0, 13.0, 13.0, 13.0, 30.0, 17.0, 44.0, 46.0, 55.0, 72.0, 112.0, 183.0, 415.0, 2256.0, 2599333.0, 540258.0, 1860.0, 399.0, 167.0, 100.0, 72.0, 40.0, 43.0, 35.0, 33.0, 20.0, 15.0, 12.0, 7.0, 7.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-100.6875, -97.8876953125, -95.087890625, -92.2880859375, -89.48828125, -86.6884765625, -83.888671875, -81.0888671875, -78.2890625, -75.4892578125, -72.689453125, -69.8896484375, -67.08984375, -64.2900390625, -61.490234375, -58.6904296875, -55.890625, -53.0908203125, -50.291015625, -47.4912109375, -44.69140625, -41.8916015625, -39.091796875, -36.2919921875, -33.4921875, -30.6923828125, -27.892578125, -25.0927734375, -22.29296875, -19.4931640625, -16.693359375, -13.8935546875, -11.09375, -8.2939453125, -5.494140625, -2.6943359375, 0.10546875, 2.9052734375, 5.705078125, 8.5048828125, 11.3046875, 14.1044921875, 16.904296875, 19.7041015625, 22.50390625, 25.3037109375, 28.103515625, 30.9033203125, 33.703125, 36.5029296875, 39.302734375, 42.1025390625, 44.90234375, 47.7021484375, 50.501953125, 53.3017578125, 56.1015625, 58.9013671875, 61.701171875, 64.5009765625, 67.30078125, 70.1005859375, 72.900390625, 75.7001953125, 78.5]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 7.0, 4.0, 23.0, 41.0, 98.0, 144.0, 207.0, 206.0, 129.0, 97.0, 26.0, 16.0, 12.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.785439491271973, -11.619653701782227, -10.453866958618164, -9.288081169128418, -8.122295379638672, -6.956509590148926, -5.7907233238220215, -4.624937057495117, -3.459151268005371, -2.293365240097046, -1.1275792121887207, 0.03820681571960449, 1.2039928436279297, 2.369778633117676, 3.53556489944458, 4.701351165771484, 5.8671369552612305, 7.032922744750977, 8.198709487915039, 9.364495277404785, 10.530281066894531, 11.696066856384277, 12.861852645874023, 14.027639389038086, 15.193425178527832, 16.359210968017578, 17.52499771118164, 18.69078254699707, 19.856569290161133, 21.022354125976562, 22.188140869140625, 23.353927612304688, 24.51971435546875, 25.685501098632812, 26.851285934448242, 28.017072677612305, 29.182857513427734, 30.348644256591797, 31.51443099975586, 32.68021774291992, 33.84600067138672, 35.01178741455078, 36.177574157714844, 37.34335708618164, 38.5091438293457, 39.674930572509766, 40.84071731567383, 42.00650405883789, 43.17229080200195, 44.338077545166016, 45.50386428833008, 46.669647216796875, 47.83543395996094, 49.001220703125, 50.16700744628906, 51.332794189453125, 52.49858093261719, 53.66436767578125, 54.83015441894531, 55.99593734741211, 57.16172409057617, 58.327510833740234, 59.4932975769043, 60.65908432006836, 61.824867248535156]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 6.0, 7.0, 5.0, 9.0, 6.0, 23.0, 19.0, 22.0, 27.0, 30.0, 29.0, 32.0, 33.0, 37.0, 36.0, 44.0, 47.0, 45.0, 43.0, 46.0, 33.0, 38.0, 35.0, 45.0, 34.0, 40.0, 28.0, 32.0, 32.0, 17.0, 22.0, 21.0, 13.0, 9.0, 15.0, 7.0, 10.0, 11.0, 2.0, 3.0, 5.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.90577697753906, -68.70343780517578, -66.5010986328125, -64.29875946044922, -62.09642028808594, -59.894081115722656, -57.69174575805664, -55.48940658569336, -53.28706741333008, -51.0847282409668, -48.882389068603516, -46.680049896240234, -44.47771453857422, -42.27537536621094, -40.073036193847656, -37.870697021484375, -35.668357849121094, -33.46601867675781, -31.26367950439453, -29.061342239379883, -26.8590030670166, -24.65666389465332, -22.454326629638672, -20.25198745727539, -18.04964828491211, -15.847309112548828, -13.644970893859863, -11.442632675170898, -9.240293502807617, -7.037954330444336, -4.835616111755371, -2.6332778930664062, -0.430938720703125, 1.771399974822998, 3.973738670349121, 6.176077365875244, 8.378416061401367, 10.580755233764648, 12.783093452453613, 14.985431671142578, 17.18777084350586, 19.39011001586914, 21.592449188232422, 23.79478645324707, 25.99712562561035, 28.199464797973633, 30.40180206298828, 32.60414123535156, 34.806480407714844, 37.008819580078125, 39.211158752441406, 41.41349792480469, 43.61583709716797, 45.81817626953125, 48.020511627197266, 50.22285079956055, 52.42518997192383, 54.62752914428711, 56.82986831665039, 59.03220748901367, 61.23454284667969, 63.43688201904297, 65.63922119140625, 67.84156036376953, 70.04389953613281]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 3.0, 1.0, 10.0, 5.0, 12.0, 7.0, 15.0, 6.0, 13.0, 13.0, 15.0, 21.0, 17.0, 21.0, 22.0, 20.0, 27.0, 29.0, 35.0, 33.0, 28.0, 29.0, 42.0, 49.0, 37.0, 31.0, 34.0, 47.0, 38.0, 42.0, 39.0, 28.0, 36.0, 33.0, 22.0, 28.0, 16.0, 12.0, 14.0, 13.0, 8.0, 9.0, 10.0, 11.0, 5.0, 5.0, 1.0, 4.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0], "bins": [-7.5, -7.28131103515625, -7.0626220703125, -6.84393310546875, -6.625244140625, -6.40655517578125, -6.1878662109375, -5.96917724609375, -5.75048828125, -5.53179931640625, -5.3131103515625, -5.09442138671875, -4.875732421875, -4.65704345703125, -4.4383544921875, -4.21966552734375, -4.0009765625, -3.78228759765625, -3.5635986328125, -3.34490966796875, -3.126220703125, -2.90753173828125, -2.6888427734375, -2.47015380859375, -2.25146484375, -2.03277587890625, -1.8140869140625, -1.59539794921875, -1.376708984375, -1.15802001953125, -0.9393310546875, -0.72064208984375, -0.501953125, -0.28326416015625, -0.0645751953125, 0.15411376953125, 0.372802734375, 0.59149169921875, 0.8101806640625, 1.02886962890625, 1.24755859375, 1.46624755859375, 1.6849365234375, 1.90362548828125, 2.122314453125, 2.34100341796875, 2.5596923828125, 2.77838134765625, 2.9970703125, 3.21575927734375, 3.4344482421875, 3.65313720703125, 3.871826171875, 4.09051513671875, 4.3092041015625, 4.52789306640625, 4.74658203125, 4.96527099609375, 5.1839599609375, 5.40264892578125, 5.621337890625, 5.84002685546875, 6.0587158203125, 6.27740478515625, 6.49609375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 5.0, 8.0, 7.0, 14.0, 12.0, 13.0, 29.0, 20.0, 29.0, 40.0, 50.0, 61.0, 101.0, 184.0, 237.0, 354.0, 631.0, 1209.0, 2352.0, 5265.0, 14985.0, 56914.0, 259665.0, 933617.0, 1599428.0, 950825.0, 279668.0, 61597.0, 15869.0, 5622.0, 2329.0, 1240.0, 682.0, 379.0, 250.0, 169.0, 116.0, 79.0, 44.0, 36.0, 34.0, 18.0, 22.0, 12.0, 16.0, 11.0, 6.0, 8.0, 6.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-8.6875, -8.411865234375, -8.13623046875, -7.860595703125, -7.5849609375, -7.309326171875, -7.03369140625, -6.758056640625, -6.482421875, -6.206787109375, -5.93115234375, -5.655517578125, -5.3798828125, -5.104248046875, -4.82861328125, -4.552978515625, -4.27734375, -4.001708984375, -3.72607421875, -3.450439453125, -3.1748046875, -2.899169921875, -2.62353515625, -2.347900390625, -2.072265625, -1.796630859375, -1.52099609375, -1.245361328125, -0.9697265625, -0.694091796875, -0.41845703125, -0.142822265625, 0.1328125, 0.408447265625, 0.68408203125, 0.959716796875, 1.2353515625, 1.510986328125, 1.78662109375, 2.062255859375, 2.337890625, 2.613525390625, 2.88916015625, 3.164794921875, 3.4404296875, 3.716064453125, 3.99169921875, 4.267333984375, 4.54296875, 4.818603515625, 5.09423828125, 5.369873046875, 5.6455078125, 5.921142578125, 6.19677734375, 6.472412109375, 6.748046875, 7.023681640625, 7.29931640625, 7.574951171875, 7.8505859375, 8.126220703125, 8.40185546875, 8.677490234375, 8.953125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 6.0, 8.0, 8.0, 14.0, 20.0, 24.0, 35.0, 27.0, 50.0, 78.0, 110.0, 162.0, 206.0, 252.0, 350.0, 413.0, 429.0, 437.0, 346.0, 297.0, 204.0, 181.0, 105.0, 94.0, 64.0, 45.0, 27.0, 23.0, 17.0, 16.0, 7.0, 9.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.2265625, -9.7933349609375, -9.360107421875, -8.9268798828125, -8.49365234375, -8.0604248046875, -7.627197265625, -7.1939697265625, -6.7607421875, -6.3275146484375, -5.894287109375, -5.4610595703125, -5.02783203125, -4.5946044921875, -4.161376953125, -3.7281494140625, -3.294921875, -2.8616943359375, -2.428466796875, -1.9952392578125, -1.56201171875, -1.1287841796875, -0.695556640625, -0.2623291015625, 0.1708984375, 0.6041259765625, 1.037353515625, 1.4705810546875, 1.90380859375, 2.3370361328125, 2.770263671875, 3.2034912109375, 3.63671875, 4.0699462890625, 4.503173828125, 4.9364013671875, 5.36962890625, 5.8028564453125, 6.236083984375, 6.6693115234375, 7.1025390625, 7.5357666015625, 7.968994140625, 8.4022216796875, 8.83544921875, 9.2686767578125, 9.701904296875, 10.1351318359375, 10.568359375, 11.0015869140625, 11.434814453125, 11.8680419921875, 12.30126953125, 12.7344970703125, 13.167724609375, 13.6009521484375, 14.0341796875, 14.4674072265625, 14.900634765625, 15.3338623046875, 15.76708984375, 16.2003173828125, 16.633544921875, 17.0667724609375, 17.5]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 10.0, 14.0, 7.0, 12.0, 25.0, 35.0, 44.0, 45.0, 80.0, 90.0, 126.0, 172.0, 221.0, 290.0, 393.0, 760.0, 2625.0, 61210.0, 3954145.0, 167280.0, 4077.0, 903.0, 459.0, 331.0, 193.0, 189.0, 120.0, 106.0, 78.0, 66.0, 54.0, 40.0, 26.0, 16.0, 10.0, 10.0, 9.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 3.0], "bins": [-60.6875, -59.115234375, -57.54296875, -55.970703125, -54.3984375, -52.826171875, -51.25390625, -49.681640625, -48.109375, -46.537109375, -44.96484375, -43.392578125, -41.8203125, -40.248046875, -38.67578125, -37.103515625, -35.53125, -33.958984375, -32.38671875, -30.814453125, -29.2421875, -27.669921875, -26.09765625, -24.525390625, -22.953125, -21.380859375, -19.80859375, -18.236328125, -16.6640625, -15.091796875, -13.51953125, -11.947265625, -10.375, -8.802734375, -7.23046875, -5.658203125, -4.0859375, -2.513671875, -0.94140625, 0.630859375, 2.203125, 3.775390625, 5.34765625, 6.919921875, 8.4921875, 10.064453125, 11.63671875, 13.208984375, 14.78125, 16.353515625, 17.92578125, 19.498046875, 21.0703125, 22.642578125, 24.21484375, 25.787109375, 27.359375, 28.931640625, 30.50390625, 32.076171875, 33.6484375, 35.220703125, 36.79296875, 38.365234375, 39.9375]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 7.0, 226.0, 688.0, 94.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-318.06634521484375, -306.83941650390625, -295.6125183105469, -284.3855895996094, -273.1586608886719, -261.9317626953125, -250.704833984375, -239.47792053222656, -228.25100708007812, -217.0240936279297, -205.7971649169922, -194.57025146484375, -183.3433380126953, -172.11642456054688, -160.88949584960938, -149.66258239746094, -138.43565368652344, -127.20873260498047, -115.98181915283203, -104.75489807128906, -93.52798461914062, -82.30106353759766, -71.07414245605469, -59.84722900390625, -48.62030792236328, -37.39339065551758, -26.166471481323242, -14.939552307128906, -3.712635040283203, 7.5142822265625, 18.74120330810547, 29.968116760253906, 41.195037841796875, 52.42195510864258, 63.64887237548828, 74.87579345703125, 86.10270690917969, 97.32962799072266, 108.55654907226562, 119.78346252441406, 131.0103759765625, 142.23728942871094, 153.46421813964844, 164.69113159179688, 175.9180450439453, 187.14495849609375, 198.37188720703125, 209.5988006591797, 220.8257293701172, 232.05264282226562, 243.27957153320312, 254.50648498535156, 265.7333984375, 276.9603271484375, 288.187255859375, 299.4141540527344, 310.6410827636719, 321.8680114746094, 333.09490966796875, 344.32183837890625, 355.54876708984375, 366.7756652832031, 378.0025939941406, 389.2294921875, 400.4564208984375]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 7.0, 3.0, 4.0, 9.0, 16.0, 10.0, 15.0, 17.0, 17.0, 23.0, 22.0, 15.0, 24.0, 25.0, 38.0, 36.0, 36.0, 38.0, 42.0, 42.0, 35.0, 39.0, 33.0, 45.0, 27.0, 32.0, 35.0, 32.0, 41.0, 29.0, 24.0, 28.0, 24.0, 19.0, 15.0, 22.0, 13.0, 8.0, 9.0, 11.0, 13.0, 8.0, 2.0, 5.0, 6.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-39.73283386230469, -38.46401596069336, -37.19519805908203, -35.92638397216797, -34.65756607055664, -33.38874816894531, -32.119930267333984, -30.851112365722656, -29.58229637145996, -28.313478469848633, -27.044662475585938, -25.77584457397461, -24.50702667236328, -23.238210678100586, -21.969392776489258, -20.700576782226562, -19.431758880615234, -18.162940979003906, -16.89412498474121, -15.625307083129883, -14.356490135192871, -13.08767318725586, -11.818855285644531, -10.55003833770752, -9.281221389770508, -8.012404441833496, -6.743587017059326, -5.474769592285156, -4.2059526443481445, -2.937135696411133, -1.668318271636963, -0.39950084686279297, 0.8693161010742188, 2.1381332874298096, 3.4069504737854004, 4.67576789855957, 5.944584846496582, 7.213401794433594, 8.482219696044922, 9.751036643981934, 11.019853591918945, 12.288670539855957, 13.557487487792969, 14.826305389404297, 16.095123291015625, 17.36393928527832, 18.63275718688965, 19.901573181152344, 21.170391082763672, 22.439208984375, 23.708024978637695, 24.976842880249023, 26.24565887451172, 27.514476776123047, 28.783294677734375, 30.052112579345703, 31.3209285736084, 32.589744567871094, 33.85856246948242, 35.12738037109375, 36.39619827270508, 37.665016174316406, 38.93383026123047, 40.2026481628418, 41.471466064453125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 7.0, 4.0, 4.0, 8.0, 7.0, 7.0, 12.0, 13.0, 10.0, 11.0, 15.0, 23.0, 21.0, 17.0, 19.0, 26.0, 40.0, 30.0, 28.0, 26.0, 34.0, 32.0, 34.0, 36.0, 40.0, 49.0, 37.0, 39.0, 43.0, 41.0, 33.0, 37.0, 20.0, 30.0, 23.0, 18.0, 21.0, 18.0, 16.0, 13.0, 13.0, 8.0, 7.0, 9.0, 7.0, 2.0, 5.0, 4.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0], "bins": [-7.21875, -7.0072021484375, -6.795654296875, -6.5841064453125, -6.37255859375, -6.1610107421875, -5.949462890625, -5.7379150390625, -5.5263671875, -5.3148193359375, -5.103271484375, -4.8917236328125, -4.68017578125, -4.4686279296875, -4.257080078125, -4.0455322265625, -3.833984375, -3.6224365234375, -3.410888671875, -3.1993408203125, -2.98779296875, -2.7762451171875, -2.564697265625, -2.3531494140625, -2.1416015625, -1.9300537109375, -1.718505859375, -1.5069580078125, -1.29541015625, -1.0838623046875, -0.872314453125, -0.6607666015625, -0.44921875, -0.2376708984375, -0.026123046875, 0.1854248046875, 0.39697265625, 0.6085205078125, 0.820068359375, 1.0316162109375, 1.2431640625, 1.4547119140625, 1.666259765625, 1.8778076171875, 2.08935546875, 2.3009033203125, 2.512451171875, 2.7239990234375, 2.935546875, 3.1470947265625, 3.358642578125, 3.5701904296875, 3.78173828125, 3.9932861328125, 4.204833984375, 4.4163818359375, 4.6279296875, 4.8394775390625, 5.051025390625, 5.2625732421875, 5.47412109375, 5.6856689453125, 5.897216796875, 6.1087646484375, 6.3203125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 7.0, 5.0, 5.0, 8.0, 14.0, 18.0, 31.0, 54.0, 84.0, 113.0, 183.0, 281.0, 439.0, 728.0, 1058.0, 1618.0, 2530.0, 4039.0, 6063.0, 9943.0, 15910.0, 25721.0, 43742.0, 77367.0, 138135.0, 213022.0, 204121.0, 127321.0, 71008.0, 40782.0, 23849.0, 14762.0, 9201.0, 5879.0, 3703.0, 2430.0, 1562.0, 1040.0, 625.0, 429.0, 263.0, 157.0, 110.0, 85.0, 48.0, 31.0, 16.0, 14.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.82470703125, -0.7980422973632812, -0.7713775634765625, -0.7447128295898438, -0.718048095703125, -0.6913833618164062, -0.6647186279296875, -0.6380538940429688, -0.61138916015625, -0.5847244262695312, -0.5580596923828125, -0.5313949584960938, -0.504730224609375, -0.47806549072265625, -0.4514007568359375, -0.42473602294921875, -0.3980712890625, -0.37140655517578125, -0.3447418212890625, -0.31807708740234375, -0.291412353515625, -0.26474761962890625, -0.2380828857421875, -0.21141815185546875, -0.18475341796875, -0.15808868408203125, -0.1314239501953125, -0.10475921630859375, -0.078094482421875, -0.05142974853515625, -0.0247650146484375, 0.00189971923828125, 0.028564453125, 0.05522918701171875, 0.0818939208984375, 0.10855865478515625, 0.135223388671875, 0.16188812255859375, 0.1885528564453125, 0.21521759033203125, 0.24188232421875, 0.26854705810546875, 0.2952117919921875, 0.32187652587890625, 0.348541259765625, 0.37520599365234375, 0.4018707275390625, 0.42853546142578125, 0.4552001953125, 0.48186492919921875, 0.5085296630859375, 0.5351943969726562, 0.561859130859375, 0.5885238647460938, 0.6151885986328125, 0.6418533325195312, 0.66851806640625, 0.6951828002929688, 0.7218475341796875, 0.7485122680664062, 0.775177001953125, 0.8018417358398438, 0.8285064697265625, 0.8551712036132812, 0.8818359375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 5.0, 4.0, 4.0, 9.0, 7.0, 10.0, 14.0, 9.0, 14.0, 20.0, 18.0, 16.0, 22.0, 22.0, 28.0, 37.0, 30.0, 28.0, 35.0, 39.0, 42.0, 34.0, 35.0, 1065.0, 28.0, 34.0, 38.0, 38.0, 39.0, 28.0, 39.0, 36.0, 27.0, 28.0, 26.0, 33.0, 15.0, 12.0, 9.0, 7.0, 12.0, 7.0, 4.0, 10.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-4.515625, -4.37481689453125, -4.2340087890625, -4.09320068359375, -3.952392578125, -3.81158447265625, -3.6707763671875, -3.52996826171875, -3.38916015625, -3.24835205078125, -3.1075439453125, -2.96673583984375, -2.825927734375, -2.68511962890625, -2.5443115234375, -2.40350341796875, -2.2626953125, -2.12188720703125, -1.9810791015625, -1.84027099609375, -1.699462890625, -1.55865478515625, -1.4178466796875, -1.27703857421875, -1.13623046875, -0.99542236328125, -0.8546142578125, -0.71380615234375, -0.572998046875, -0.43218994140625, -0.2913818359375, -0.15057373046875, -0.009765625, 0.13104248046875, 0.2718505859375, 0.41265869140625, 0.553466796875, 0.69427490234375, 0.8350830078125, 0.97589111328125, 1.11669921875, 1.25750732421875, 1.3983154296875, 1.53912353515625, 1.679931640625, 1.82073974609375, 1.9615478515625, 2.10235595703125, 2.2431640625, 2.38397216796875, 2.5247802734375, 2.66558837890625, 2.806396484375, 2.94720458984375, 3.0880126953125, 3.22882080078125, 3.36962890625, 3.51043701171875, 3.6512451171875, 3.79205322265625, 3.932861328125, 4.07366943359375, 4.2144775390625, 4.35528564453125, 4.49609375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 7.0, 6.0, 15.0, 20.0, 34.0, 40.0, 82.0, 125.0, 175.0, 302.0, 528.0, 892.0, 1488.0, 2620.0, 4558.0, 7957.0, 14624.0, 26582.0, 50689.0, 98703.0, 185876.0, 1304897.0, 186720.0, 98906.0, 50705.0, 26997.0, 14481.0, 8033.0, 4550.0, 2721.0, 1522.0, 890.0, 524.0, 317.0, 203.0, 118.0, 75.0, 61.0, 40.0, 14.0, 12.0, 9.0, 6.0, 2.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.88671875, -0.8576507568359375, -0.828582763671875, -0.7995147705078125, -0.77044677734375, -0.7413787841796875, -0.712310791015625, -0.6832427978515625, -0.6541748046875, -0.6251068115234375, -0.596038818359375, -0.5669708251953125, -0.53790283203125, -0.5088348388671875, -0.479766845703125, -0.4506988525390625, -0.421630859375, -0.3925628662109375, -0.363494873046875, -0.3344268798828125, -0.30535888671875, -0.2762908935546875, -0.247222900390625, -0.2181549072265625, -0.1890869140625, -0.1600189208984375, -0.130950927734375, -0.1018829345703125, -0.07281494140625, -0.0437469482421875, -0.014678955078125, 0.0143890380859375, 0.04345703125, 0.0725250244140625, 0.101593017578125, 0.1306610107421875, 0.15972900390625, 0.1887969970703125, 0.217864990234375, 0.2469329833984375, 0.2760009765625, 0.3050689697265625, 0.334136962890625, 0.3632049560546875, 0.39227294921875, 0.4213409423828125, 0.450408935546875, 0.4794769287109375, 0.508544921875, 0.5376129150390625, 0.566680908203125, 0.5957489013671875, 0.62481689453125, 0.6538848876953125, 0.682952880859375, 0.7120208740234375, 0.7410888671875, 0.7701568603515625, 0.799224853515625, 0.8282928466796875, 0.85736083984375, 0.8864288330078125, 0.915496826171875, 0.9445648193359375, 0.9736328125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 2.0, 6.0, 3.0, 4.0, 8.0, 5.0, 10.0, 18.0, 14.0, 19.0, 25.0, 32.0, 24.0, 39.0, 39.0, 42.0, 40.0, 54.0, 54.0, 53.0, 48.0, 51.0, 44.0, 34.0, 55.0, 50.0, 33.0, 40.0, 27.0, 25.0, 27.0, 21.0, 11.0, 5.0, 10.0, 11.0, 9.0, 2.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002048492431640625, -0.001981496810913086, -0.0019145011901855469, -0.0018475055694580078, -0.0017805099487304688, -0.0017135143280029297, -0.0016465187072753906, -0.0015795230865478516, -0.0015125274658203125, -0.0014455318450927734, -0.0013785362243652344, -0.0013115406036376953, -0.0012445449829101562, -0.0011775493621826172, -0.0011105537414550781, -0.001043558120727539, -0.0009765625, -0.0009095668792724609, -0.0008425712585449219, -0.0007755756378173828, -0.0007085800170898438, -0.0006415843963623047, -0.0005745887756347656, -0.0005075931549072266, -0.0004405975341796875, -0.00037360191345214844, -0.0003066062927246094, -0.0002396106719970703, -0.00017261505126953125, -0.00010561943054199219, -3.8623809814453125e-05, 2.8371810913085938e-05, 9.5367431640625e-05, 0.00016236305236816406, 0.00022935867309570312, 0.0002963542938232422, 0.00036334991455078125, 0.0004303455352783203, 0.0004973411560058594, 0.0005643367767333984, 0.0006313323974609375, 0.0006983280181884766, 0.0007653236389160156, 0.0008323192596435547, 0.0008993148803710938, 0.0009663105010986328, 0.0010333061218261719, 0.001100301742553711, 0.00116729736328125, 0.001234292984008789, 0.0013012886047363281, 0.0013682842254638672, 0.0014352798461914062, 0.0015022754669189453, 0.0015692710876464844, 0.0016362667083740234, 0.0017032623291015625, 0.0017702579498291016, 0.0018372535705566406, 0.0019042491912841797, 0.0019712448120117188, 0.002038240432739258, 0.002105236053466797, 0.002172231674194336, 0.002239227294921875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 6.0, 6.0, 5.0, 8.0, 5.0, 9.0, 14.0, 27.0, 13.0, 25.0, 32.0, 60.0, 75.0, 88.0, 104.0, 160.0, 342.0, 855.0, 22032.0, 1021302.0, 1975.0, 584.0, 239.0, 153.0, 99.0, 82.0, 60.0, 43.0, 35.0, 33.0, 24.0, 17.0, 9.0, 17.0, 3.0, 4.0, 8.0, 6.0, 3.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04931640625, -0.04774045944213867, -0.046164512634277344, -0.044588565826416016, -0.04301261901855469, -0.04143667221069336, -0.03986072540283203, -0.0382847785949707, -0.036708831787109375, -0.03513288497924805, -0.03355693817138672, -0.03198099136352539, -0.030405044555664062, -0.028829097747802734, -0.027253150939941406, -0.025677204132080078, -0.02410125732421875, -0.022525310516357422, -0.020949363708496094, -0.019373416900634766, -0.017797470092773438, -0.01622152328491211, -0.014645576477050781, -0.013069629669189453, -0.011493682861328125, -0.009917736053466797, -0.008341789245605469, -0.006765842437744141, -0.0051898956298828125, -0.0036139488220214844, -0.0020380020141601562, -0.0004620552062988281, 0.0011138916015625, 0.002689838409423828, 0.004265785217285156, 0.005841732025146484, 0.0074176788330078125, 0.00899362564086914, 0.010569572448730469, 0.012145519256591797, 0.013721466064453125, 0.015297412872314453, 0.01687335968017578, 0.01844930648803711, 0.020025253295898438, 0.021601200103759766, 0.023177146911621094, 0.024753093719482422, 0.02632904052734375, 0.027904987335205078, 0.029480934143066406, 0.031056880950927734, 0.03263282775878906, 0.03420877456665039, 0.03578472137451172, 0.03736066818237305, 0.038936614990234375, 0.0405125617980957, 0.04208850860595703, 0.04366445541381836, 0.04524040222167969, 0.046816349029541016, 0.048392295837402344, 0.04996824264526367, 0.051544189453125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 11.0, 606.0, 394.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.019307168200612068, -0.018949104472994804, -0.01859104074537754, -0.018232977017760277, -0.017874913290143013, -0.01751684956252575, -0.017158785834908485, -0.01680072210729122, -0.016442658379673958, -0.016084594652056694, -0.01572653092443943, -0.015368467196822166, -0.015010403469204903, -0.014652339741587639, -0.014294276013970375, -0.013936212286353111, -0.013578148558735847, -0.013220084831118584, -0.01286202110350132, -0.012503957375884056, -0.012145893648266792, -0.011787829920649529, -0.011429766193032265, -0.011071702465415001, -0.010713638737797737, -0.010355575010180473, -0.00999751128256321, -0.009639447554945946, -0.009281383827328682, -0.008923320099711418, -0.008565256372094154, -0.00820719264447689, -0.007849128916859627, -0.007491065189242363, -0.007133001461625099, -0.006774937734007835, -0.006416874006390572, -0.006058810278773308, -0.005700746551156044, -0.00534268282353878, -0.004984619095921516, -0.004626555368304253, -0.004268491640686989, -0.003910427913069725, -0.0035523641854524612, -0.0031943004578351974, -0.0028362367302179337, -0.00247817300260067, -0.002120109274983406, -0.0017620455473661423, -0.0014039818197488785, -0.0010459180921316147, -0.0006878543645143509, -0.0003297906368970871, 2.8273090720176697e-05, 0.0003863368183374405, 0.0007444005459547043, 0.001102464273571968, 0.0014605280011892319, 0.0018185917288064957, 0.0021766554564237595, 0.0025347191840410233, 0.002892782911658287, 0.003250846639275551, 0.0036089103668928146]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 8.0, 3.0, 6.0, 4.0, 15.0, 9.0, 15.0, 10.0, 14.0, 16.0, 17.0, 17.0, 20.0, 29.0, 26.0, 35.0, 34.0, 37.0, 31.0, 44.0, 45.0, 42.0, 30.0, 37.0, 35.0, 41.0, 50.0, 38.0, 34.0, 33.0, 26.0, 26.0, 22.0, 23.0, 18.0, 26.0, 15.0, 13.0, 7.0, 7.0, 7.0, 7.0, 3.0, 7.0, 7.0, 3.0, 5.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0], "bins": [-0.0011246800422668457, -0.0010912977159023285, -0.0010579153895378113, -0.001024533063173294, -0.0009911507368087769, -0.0009577684104442596, -0.0009243860840797424, -0.0008910037577152252, -0.000857621431350708, -0.0008242391049861908, -0.0007908567786216736, -0.0007574744522571564, -0.0007240921258926392, -0.000690709799528122, -0.0006573274731636047, -0.0006239451467990875, -0.0005905628204345703, -0.0005571804940700531, -0.0005237981677055359, -0.0004904158413410187, -0.00045703351497650146, -0.00042365118861198425, -0.00039026886224746704, -0.00035688653588294983, -0.0003235042095184326, -0.0002901218831539154, -0.0002567395567893982, -0.00022335723042488098, -0.00018997490406036377, -0.00015659257769584656, -0.00012321025133132935, -8.982792496681213e-05, -5.644559860229492e-05, -2.306327223777771e-05, 1.0319054126739502e-05, 4.3701380491256714e-05, 7.708370685577393e-05, 0.00011046603322029114, 0.00014384835958480835, 0.00017723068594932556, 0.00021061301231384277, 0.00024399533867835999, 0.0002773776650428772, 0.0003107599914073944, 0.0003441423177719116, 0.00037752464413642883, 0.00041090697050094604, 0.00044428929686546326, 0.00047767162322998047, 0.0005110539495944977, 0.0005444362759590149, 0.0005778186023235321, 0.0006112009286880493, 0.0006445832550525665, 0.0006779655814170837, 0.000711347907781601, 0.0007447302341461182, 0.0007781125605106354, 0.0008114948868751526, 0.0008448772132396698, 0.000878259539604187, 0.0009116418659687042, 0.0009450241923332214, 0.0009784065186977386, 0.0010117888450622559]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 4.0, 7.0, 4.0, 4.0, 8.0, 7.0, 7.0, 12.0, 13.0, 10.0, 11.0, 15.0, 23.0, 21.0, 17.0, 19.0, 26.0, 40.0, 30.0, 28.0, 26.0, 34.0, 32.0, 34.0, 36.0, 40.0, 49.0, 37.0, 39.0, 43.0, 41.0, 33.0, 37.0, 20.0, 30.0, 23.0, 18.0, 21.0, 18.0, 16.0, 13.0, 13.0, 8.0, 7.0, 9.0, 7.0, 2.0, 5.0, 4.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0], "bins": [-7.21875, -7.0072021484375, -6.795654296875, -6.5841064453125, -6.37255859375, -6.1610107421875, -5.949462890625, -5.7379150390625, -5.5263671875, -5.3148193359375, -5.103271484375, -4.8917236328125, -4.68017578125, -4.4686279296875, -4.257080078125, -4.0455322265625, -3.833984375, -3.6224365234375, -3.410888671875, -3.1993408203125, -2.98779296875, -2.7762451171875, -2.564697265625, -2.3531494140625, -2.1416015625, -1.9300537109375, -1.718505859375, -1.5069580078125, -1.29541015625, -1.0838623046875, -0.872314453125, -0.6607666015625, -0.44921875, -0.2376708984375, -0.026123046875, 0.1854248046875, 0.39697265625, 0.6085205078125, 0.820068359375, 1.0316162109375, 1.2431640625, 1.4547119140625, 1.666259765625, 1.8778076171875, 2.08935546875, 2.3009033203125, 2.512451171875, 2.7239990234375, 2.935546875, 3.1470947265625, 3.358642578125, 3.5701904296875, 3.78173828125, 3.9932861328125, 4.204833984375, 4.4163818359375, 4.6279296875, 4.8394775390625, 5.051025390625, 5.2625732421875, 5.47412109375, 5.6856689453125, 5.897216796875, 6.1087646484375, 6.3203125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 7.0, 6.0, 6.0, 8.0, 12.0, 12.0, 21.0, 27.0, 33.0, 32.0, 65.0, 73.0, 121.0, 204.0, 381.0, 634.0, 1206.0, 2322.0, 4357.0, 8844.0, 18184.0, 41685.0, 103061.0, 280519.0, 352608.0, 135383.0, 53424.0, 23302.0, 10636.0, 5262.0, 2703.0, 1436.0, 777.0, 438.0, 258.0, 148.0, 99.0, 68.0, 52.0, 47.0, 18.0, 16.0, 15.0, 6.0, 10.0, 6.0, 6.0, 7.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0], "bins": [-6.1328125, -5.95318603515625, -5.7735595703125, -5.59393310546875, -5.414306640625, -5.23468017578125, -5.0550537109375, -4.87542724609375, -4.69580078125, -4.51617431640625, -4.3365478515625, -4.15692138671875, -3.977294921875, -3.79766845703125, -3.6180419921875, -3.43841552734375, -3.2587890625, -3.07916259765625, -2.8995361328125, -2.71990966796875, -2.540283203125, -2.36065673828125, -2.1810302734375, -2.00140380859375, -1.82177734375, -1.64215087890625, -1.4625244140625, -1.28289794921875, -1.103271484375, -0.92364501953125, -0.7440185546875, -0.56439208984375, -0.384765625, -0.20513916015625, -0.0255126953125, 0.15411376953125, 0.333740234375, 0.51336669921875, 0.6929931640625, 0.87261962890625, 1.05224609375, 1.23187255859375, 1.4114990234375, 1.59112548828125, 1.770751953125, 1.95037841796875, 2.1300048828125, 2.30963134765625, 2.4892578125, 2.66888427734375, 2.8485107421875, 3.02813720703125, 3.207763671875, 3.38739013671875, 3.5670166015625, 3.74664306640625, 3.92626953125, 4.10589599609375, 4.2855224609375, 4.46514892578125, 4.644775390625, 4.82440185546875, 5.0040283203125, 5.18365478515625, 5.36328125]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 3.0, 7.0, 4.0, 11.0, 11.0, 10.0, 8.0, 16.0, 19.0, 30.0, 26.0, 36.0, 35.0, 31.0, 42.0, 46.0, 51.0, 75.0, 167.0, 1661.0, 260.0, 85.0, 47.0, 51.0, 38.0, 35.0, 32.0, 30.0, 24.0, 35.0, 22.0, 15.0, 10.0, 9.0, 11.0, 10.0, 11.0, 5.0, 8.0, 4.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-26.59375, -25.826416015625, -25.05908203125, -24.291748046875, -23.5244140625, -22.757080078125, -21.98974609375, -21.222412109375, -20.455078125, -19.687744140625, -18.92041015625, -18.153076171875, -17.3857421875, -16.618408203125, -15.85107421875, -15.083740234375, -14.31640625, -13.549072265625, -12.78173828125, -12.014404296875, -11.2470703125, -10.479736328125, -9.71240234375, -8.945068359375, -8.177734375, -7.410400390625, -6.64306640625, -5.875732421875, -5.1083984375, -4.341064453125, -3.57373046875, -2.806396484375, -2.0390625, -1.271728515625, -0.50439453125, 0.262939453125, 1.0302734375, 1.797607421875, 2.56494140625, 3.332275390625, 4.099609375, 4.866943359375, 5.63427734375, 6.401611328125, 7.1689453125, 7.936279296875, 8.70361328125, 9.470947265625, 10.23828125, 11.005615234375, 11.77294921875, 12.540283203125, 13.3076171875, 14.074951171875, 14.84228515625, 15.609619140625, 16.376953125, 17.144287109375, 17.91162109375, 18.678955078125, 19.4462890625, 20.213623046875, 20.98095703125, 21.748291015625, 22.515625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 10.0, 10.0, 6.0, 8.0, 15.0, 16.0, 18.0, 19.0, 21.0, 40.0, 46.0, 71.0, 75.0, 98.0, 128.0, 174.0, 297.0, 483.0, 1200.0, 24803.0, 3036452.0, 77972.0, 2038.0, 567.0, 292.0, 218.0, 139.0, 115.0, 95.0, 68.0, 52.0, 41.0, 19.0, 17.0, 17.0, 11.0, 15.0, 11.0, 8.0, 5.0, 5.0, 5.0, 6.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.6875, -36.4150390625, -35.142578125, -33.8701171875, -32.59765625, -31.3251953125, -30.052734375, -28.7802734375, -27.5078125, -26.2353515625, -24.962890625, -23.6904296875, -22.41796875, -21.1455078125, -19.873046875, -18.6005859375, -17.328125, -16.0556640625, -14.783203125, -13.5107421875, -12.23828125, -10.9658203125, -9.693359375, -8.4208984375, -7.1484375, -5.8759765625, -4.603515625, -3.3310546875, -2.05859375, -0.7861328125, 0.486328125, 1.7587890625, 3.03125, 4.3037109375, 5.576171875, 6.8486328125, 8.12109375, 9.3935546875, 10.666015625, 11.9384765625, 13.2109375, 14.4833984375, 15.755859375, 17.0283203125, 18.30078125, 19.5732421875, 20.845703125, 22.1181640625, 23.390625, 24.6630859375, 25.935546875, 27.2080078125, 28.48046875, 29.7529296875, 31.025390625, 32.2978515625, 33.5703125, 34.8427734375, 36.115234375, 37.3876953125, 38.66015625, 39.9326171875, 41.205078125, 42.4775390625, 43.75]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 664.0, 353.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-563.2183837890625, -553.318603515625, -543.4188842773438, -533.5191040039062, -523.619384765625, -513.7196044921875, -503.8198547363281, -493.92010498046875, -484.02032470703125, -474.1205749511719, -464.2208251953125, -454.321044921875, -444.4212951660156, -434.52154541015625, -424.6217956542969, -414.7220458984375, -404.822265625, -394.9225158691406, -385.02276611328125, -375.12298583984375, -365.2232360839844, -355.323486328125, -345.4237365722656, -335.52398681640625, -325.6242370605469, -315.7244873046875, -305.8247375488281, -295.9249572753906, -286.02520751953125, -276.1254577636719, -266.2257080078125, -256.325927734375, -246.4261932373047, -236.5264434814453, -226.62667846679688, -216.7269287109375, -206.82716369628906, -196.9274139404297, -187.02764892578125, -177.12789916992188, -167.2281494140625, -157.32839965820312, -147.4286346435547, -137.5288848876953, -127.62911987304688, -117.7293701171875, -107.8296127319336, -97.92985534667969, -88.03009033203125, -78.13033294677734, -68.23057556152344, -58.3308219909668, -48.43106460571289, -38.531307220458984, -28.631553649902344, -18.731796264648438, -8.832038879394531, 1.0677175521850586, 10.967473983764648, 20.867229461669922, 30.766986846923828, 40.666744232177734, 50.566497802734375, 60.46625518798828, 70.36601257324219]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 5.0, 8.0, 4.0, 8.0, 9.0, 11.0, 14.0, 15.0, 15.0, 21.0, 20.0, 23.0, 31.0, 29.0, 32.0, 26.0, 37.0, 42.0, 30.0, 33.0, 34.0, 41.0, 32.0, 35.0, 35.0, 39.0, 49.0, 38.0, 31.0, 41.0, 22.0, 22.0, 18.0, 23.0, 20.0, 14.0, 19.0, 19.0, 13.0, 6.0, 9.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-52.26874542236328, -50.4813232421875, -48.69390106201172, -46.90647888183594, -45.11906051635742, -43.33163833618164, -41.54421615600586, -39.75679397583008, -37.96937561035156, -36.18195343017578, -34.39453125, -32.60710906982422, -30.819690704345703, -29.032268524169922, -27.24484634399414, -25.45742416381836, -23.670001983642578, -21.882579803466797, -20.09515953063965, -18.307737350463867, -16.52031707763672, -14.732894897460938, -12.945472717285156, -11.158051490783691, -9.370630264282227, -7.583209037780762, -5.795787334442139, -4.008365631103516, -2.220944404602051, -0.43352317810058594, 1.3538990020751953, 3.14132022857666, 4.928741455078125, 6.71616268157959, 8.503583908081055, 10.291006088256836, 12.0784273147583, 13.865848541259766, 15.653270721435547, 17.440692901611328, 19.228113174438477, 21.015535354614258, 22.802955627441406, 24.590377807617188, 26.37779998779297, 28.165220260620117, 29.9526424407959, 31.740062713623047, 33.52748489379883, 35.31490707397461, 37.10232925415039, 38.889747619628906, 40.67716979980469, 42.46459197998047, 44.25201416015625, 46.03943634033203, 47.82685852050781, 49.614280700683594, 51.401702880859375, 53.189125061035156, 54.97654342651367, 56.76396560668945, 58.551387786865234, 60.338809967041016, 62.12622833251953]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 10.0, 6.0, 9.0, 6.0, 9.0, 11.0, 14.0, 6.0, 18.0, 15.0, 19.0, 18.0, 24.0, 25.0, 31.0, 28.0, 38.0, 28.0, 25.0, 33.0, 37.0, 40.0, 42.0, 38.0, 42.0, 44.0, 48.0, 45.0, 36.0, 25.0, 22.0, 25.0, 26.0, 22.0, 18.0, 18.0, 18.0, 16.0, 13.0, 8.0, 6.0, 10.0, 7.0, 3.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0], "bins": [-7.39453125, -7.173583984375, -6.95263671875, -6.731689453125, -6.5107421875, -6.289794921875, -6.06884765625, -5.847900390625, -5.626953125, -5.406005859375, -5.18505859375, -4.964111328125, -4.7431640625, -4.522216796875, -4.30126953125, -4.080322265625, -3.859375, -3.638427734375, -3.41748046875, -3.196533203125, -2.9755859375, -2.754638671875, -2.53369140625, -2.312744140625, -2.091796875, -1.870849609375, -1.64990234375, -1.428955078125, -1.2080078125, -0.987060546875, -0.76611328125, -0.545166015625, -0.32421875, -0.103271484375, 0.11767578125, 0.338623046875, 0.5595703125, 0.780517578125, 1.00146484375, 1.222412109375, 1.443359375, 1.664306640625, 1.88525390625, 2.106201171875, 2.3271484375, 2.548095703125, 2.76904296875, 2.989990234375, 3.2109375, 3.431884765625, 3.65283203125, 3.873779296875, 4.0947265625, 4.315673828125, 4.53662109375, 4.757568359375, 4.978515625, 5.199462890625, 5.42041015625, 5.641357421875, 5.8623046875, 6.083251953125, 6.30419921875, 6.525146484375, 6.74609375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 8.0, 5.0, 9.0, 11.0, 16.0, 15.0, 17.0, 19.0, 23.0, 27.0, 29.0, 41.0, 42.0, 60.0, 86.0, 136.0, 258.0, 634.0, 2561.0, 19715.0, 496574.0, 3285645.0, 368519.0, 16200.0, 2303.0, 552.0, 221.0, 141.0, 80.0, 63.0, 54.0, 42.0, 33.0, 26.0, 18.0, 25.0, 8.0, 13.0, 10.0, 8.0, 6.0, 7.0, 5.0, 4.0, 1.0, 5.0, 5.0, 1.0, 4.0, 0.0, 2.0], "bins": [-23.78125, -23.091064453125, -22.40087890625, -21.710693359375, -21.0205078125, -20.330322265625, -19.64013671875, -18.949951171875, -18.259765625, -17.569580078125, -16.87939453125, -16.189208984375, -15.4990234375, -14.808837890625, -14.11865234375, -13.428466796875, -12.73828125, -12.048095703125, -11.35791015625, -10.667724609375, -9.9775390625, -9.287353515625, -8.59716796875, -7.906982421875, -7.216796875, -6.526611328125, -5.83642578125, -5.146240234375, -4.4560546875, -3.765869140625, -3.07568359375, -2.385498046875, -1.6953125, -1.005126953125, -0.31494140625, 0.375244140625, 1.0654296875, 1.755615234375, 2.44580078125, 3.135986328125, 3.826171875, 4.516357421875, 5.20654296875, 5.896728515625, 6.5869140625, 7.277099609375, 7.96728515625, 8.657470703125, 9.34765625, 10.037841796875, 10.72802734375, 11.418212890625, 12.1083984375, 12.798583984375, 13.48876953125, 14.178955078125, 14.869140625, 15.559326171875, 16.24951171875, 16.939697265625, 17.6298828125, 18.320068359375, 19.01025390625, 19.700439453125, 20.390625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 4.0, 3.0, 3.0, 9.0, 8.0, 12.0, 11.0, 19.0, 20.0, 26.0, 36.0, 39.0, 55.0, 74.0, 113.0, 141.0, 169.0, 225.0, 275.0, 386.0, 413.0, 405.0, 370.0, 307.0, 255.0, 173.0, 140.0, 87.0, 60.0, 64.0, 47.0, 30.0, 24.0, 23.0, 11.0, 15.0, 6.0, 9.0, 1.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.1875, -11.828857421875, -11.47021484375, -11.111572265625, -10.7529296875, -10.394287109375, -10.03564453125, -9.677001953125, -9.318359375, -8.959716796875, -8.60107421875, -8.242431640625, -7.8837890625, -7.525146484375, -7.16650390625, -6.807861328125, -6.44921875, -6.090576171875, -5.73193359375, -5.373291015625, -5.0146484375, -4.656005859375, -4.29736328125, -3.938720703125, -3.580078125, -3.221435546875, -2.86279296875, -2.504150390625, -2.1455078125, -1.786865234375, -1.42822265625, -1.069580078125, -0.7109375, -0.352294921875, 0.00634765625, 0.364990234375, 0.7236328125, 1.082275390625, 1.44091796875, 1.799560546875, 2.158203125, 2.516845703125, 2.87548828125, 3.234130859375, 3.5927734375, 3.951416015625, 4.31005859375, 4.668701171875, 5.02734375, 5.385986328125, 5.74462890625, 6.103271484375, 6.4619140625, 6.820556640625, 7.17919921875, 7.537841796875, 7.896484375, 8.255126953125, 8.61376953125, 8.972412109375, 9.3310546875, 9.689697265625, 10.04833984375, 10.406982421875, 10.765625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 9.0, 6.0, 1.0, 8.0, 2.0, 11.0, 19.0, 18.0, 20.0, 32.0, 43.0, 45.0, 73.0, 88.0, 108.0, 148.0, 155.0, 268.0, 409.0, 905.0, 5662.0, 193772.0, 3893590.0, 92917.0, 3839.0, 778.0, 350.0, 239.0, 156.0, 131.0, 107.0, 78.0, 58.0, 63.0, 38.0, 29.0, 23.0, 25.0, 16.0, 14.0, 3.0, 9.0, 10.0, 5.0, 2.0, 5.0, 1.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.25, -38.7265625, -37.203125, -35.6796875, -34.15625, -32.6328125, -31.109375, -29.5859375, -28.0625, -26.5390625, -25.015625, -23.4921875, -21.96875, -20.4453125, -18.921875, -17.3984375, -15.875, -14.3515625, -12.828125, -11.3046875, -9.78125, -8.2578125, -6.734375, -5.2109375, -3.6875, -2.1640625, -0.640625, 0.8828125, 2.40625, 3.9296875, 5.453125, 6.9765625, 8.5, 10.0234375, 11.546875, 13.0703125, 14.59375, 16.1171875, 17.640625, 19.1640625, 20.6875, 22.2109375, 23.734375, 25.2578125, 26.78125, 28.3046875, 29.828125, 31.3515625, 32.875, 34.3984375, 35.921875, 37.4453125, 38.96875, 40.4921875, 42.015625, 43.5390625, 45.0625, 46.5859375, 48.109375, 49.6328125, 51.15625, 52.6796875, 54.203125, 55.7265625, 57.25]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 44.0, 187.0, 399.0, 300.0, 67.0, 16.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.08457946777344, -54.49012756347656, -48.89567565917969, -43.30122756958008, -37.7067756652832, -32.11232376098633, -26.51787567138672, -20.923423767089844, -15.328971862792969, -9.73452091217041, -4.140069961547852, 1.4543800354003906, 7.048831939697266, 12.64328384399414, 18.23773193359375, 23.832183837890625, 29.4266357421875, 35.021087646484375, 40.61553955078125, 46.20998764038086, 51.804439544677734, 57.39889144897461, 62.99333953857422, 68.5877914428711, 74.18224334716797, 79.77669525146484, 85.37114715576172, 90.96559143066406, 96.56004333496094, 102.15449523925781, 107.74894714355469, 113.34339904785156, 118.93783569335938, 124.53228759765625, 130.12673950195312, 135.72119140625, 141.31564331054688, 146.91009521484375, 152.50454711914062, 158.0989990234375, 163.69345092773438, 169.28790283203125, 174.88235473632812, 180.476806640625, 186.07125854492188, 191.66571044921875, 197.26016235351562, 202.8546142578125, 208.4490509033203, 214.0435028076172, 219.63795471191406, 225.23240661621094, 230.8268585205078, 236.4213104248047, 242.0157470703125, 247.61019897460938, 253.20465087890625, 258.7991027832031, 264.3935546875, 269.9880065917969, 275.58245849609375, 281.1769104003906, 286.7713623046875, 292.3658142089844, 297.96026611328125]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 4.0, 3.0, 7.0, 8.0, 11.0, 10.0, 15.0, 13.0, 18.0, 20.0, 25.0, 26.0, 30.0, 29.0, 26.0, 40.0, 30.0, 42.0, 49.0, 54.0, 33.0, 53.0, 41.0, 46.0, 39.0, 39.0, 37.0, 34.0, 24.0, 43.0, 22.0, 15.0, 22.0, 12.0, 14.0, 9.0, 12.0, 8.0, 6.0, 13.0, 6.0, 3.0, 3.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-37.6015625, -36.27720642089844, -34.95284652709961, -33.62849044799805, -32.30413055419922, -30.979774475097656, -29.65541648864746, -28.331058502197266, -27.006702423095703, -25.682344436645508, -24.357986450195312, -23.03363037109375, -21.709272384643555, -20.38491439819336, -19.060556411743164, -17.73619842529297, -16.411840438842773, -15.087482452392578, -13.7631254196167, -12.438767433166504, -11.114410400390625, -9.79005241394043, -8.465694427490234, -7.1413373947143555, -5.81697940826416, -4.492621898651123, -3.168264150619507, -1.8439064025878906, -0.5195488929748535, 0.8048086166381836, 2.129166603088379, 3.453523635864258, 4.777881622314453, 6.10223913192749, 7.426596641540527, 8.750954627990723, 10.075311660766602, 11.399669647216797, 12.724027633666992, 14.048384666442871, 15.372742652893066, 16.697099685668945, 18.02145767211914, 19.345815658569336, 20.67017364501953, 21.994529724121094, 23.318889617919922, 24.643245697021484, 25.96760368347168, 27.291961669921875, 28.61631965637207, 29.940677642822266, 31.265033721923828, 32.589393615722656, 33.91374969482422, 35.23810577392578, 36.56246566772461, 37.88682174682617, 39.211181640625, 40.53553771972656, 41.85989761352539, 43.18425369262695, 44.50861358642578, 45.832969665527344, 47.157325744628906]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 3.0, 7.0, 8.0, 11.0, 6.0, 11.0, 9.0, 17.0, 20.0, 18.0, 14.0, 26.0, 23.0, 23.0, 18.0, 23.0, 32.0, 29.0, 36.0, 27.0, 43.0, 32.0, 33.0, 51.0, 31.0, 47.0, 40.0, 33.0, 40.0, 42.0, 30.0, 24.0, 22.0, 14.0, 22.0, 22.0, 22.0, 16.0, 11.0, 10.0, 13.0, 9.0, 6.0, 5.0, 1.0, 4.0, 4.0, 2.0, 5.0, 2.0, 3.0], "bins": [-7.6171875, -7.40386962890625, -7.1905517578125, -6.97723388671875, -6.763916015625, -6.55059814453125, -6.3372802734375, -6.12396240234375, -5.91064453125, -5.69732666015625, -5.4840087890625, -5.27069091796875, -5.057373046875, -4.84405517578125, -4.6307373046875, -4.41741943359375, -4.2041015625, -3.99078369140625, -3.7774658203125, -3.56414794921875, -3.350830078125, -3.13751220703125, -2.9241943359375, -2.71087646484375, -2.49755859375, -2.28424072265625, -2.0709228515625, -1.85760498046875, -1.644287109375, -1.43096923828125, -1.2176513671875, -1.00433349609375, -0.791015625, -0.57769775390625, -0.3643798828125, -0.15106201171875, 0.062255859375, 0.27557373046875, 0.4888916015625, 0.70220947265625, 0.91552734375, 1.12884521484375, 1.3421630859375, 1.55548095703125, 1.768798828125, 1.98211669921875, 2.1954345703125, 2.40875244140625, 2.6220703125, 2.83538818359375, 3.0487060546875, 3.26202392578125, 3.475341796875, 3.68865966796875, 3.9019775390625, 4.11529541015625, 4.32861328125, 4.54193115234375, 4.7552490234375, 4.96856689453125, 5.181884765625, 5.39520263671875, 5.6085205078125, 5.82183837890625, 6.03515625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 9.0, 2.0, 12.0, 9.0, 19.0, 31.0, 30.0, 50.0, 81.0, 115.0, 147.0, 226.0, 366.0, 537.0, 706.0, 1072.0, 1478.0, 2193.0, 3230.0, 4627.0, 6932.0, 10253.0, 15517.0, 23915.0, 38271.0, 62483.0, 103477.0, 162572.0, 197454.0, 154030.0, 96781.0, 58534.0, 35754.0, 22403.0, 14613.0, 9735.0, 6592.0, 4484.0, 3038.0, 2136.0, 1422.0, 999.0, 646.0, 463.0, 364.0, 226.0, 172.0, 124.0, 90.0, 61.0, 24.0, 21.0, 19.0, 9.0, 6.0, 5.0, 4.0, 2.0, 3.0], "bins": [-0.7294921875, -0.707672119140625, -0.68585205078125, -0.664031982421875, -0.6422119140625, -0.620391845703125, -0.59857177734375, -0.576751708984375, -0.554931640625, -0.533111572265625, -0.51129150390625, -0.489471435546875, -0.4676513671875, -0.445831298828125, -0.42401123046875, -0.402191162109375, -0.38037109375, -0.358551025390625, -0.33673095703125, -0.314910888671875, -0.2930908203125, -0.271270751953125, -0.24945068359375, -0.227630615234375, -0.205810546875, -0.183990478515625, -0.16217041015625, -0.140350341796875, -0.1185302734375, -0.096710205078125, -0.07489013671875, -0.053070068359375, -0.03125, -0.009429931640625, 0.01239013671875, 0.034210205078125, 0.0560302734375, 0.077850341796875, 0.09967041015625, 0.121490478515625, 0.143310546875, 0.165130615234375, 0.18695068359375, 0.208770751953125, 0.2305908203125, 0.252410888671875, 0.27423095703125, 0.296051025390625, 0.31787109375, 0.339691162109375, 0.36151123046875, 0.383331298828125, 0.4051513671875, 0.426971435546875, 0.44879150390625, 0.470611572265625, 0.492431640625, 0.514251708984375, 0.53607177734375, 0.557891845703125, 0.5797119140625, 0.601531982421875, 0.62335205078125, 0.645172119140625, 0.6669921875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 2.0, 6.0, 8.0, 10.0, 8.0, 5.0, 22.0, 17.0, 29.0, 16.0, 19.0, 37.0, 29.0, 28.0, 27.0, 41.0, 37.0, 51.0, 44.0, 43.0, 1064.0, 48.0, 46.0, 31.0, 41.0, 30.0, 42.0, 32.0, 31.0, 31.0, 30.0, 13.0, 18.0, 16.0, 21.0, 13.0, 9.0, 7.0, 8.0, 9.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.19921875, -5.03900146484375, -4.8787841796875, -4.71856689453125, -4.558349609375, -4.39813232421875, -4.2379150390625, -4.07769775390625, -3.91748046875, -3.75726318359375, -3.5970458984375, -3.43682861328125, -3.276611328125, -3.11639404296875, -2.9561767578125, -2.79595947265625, -2.6357421875, -2.47552490234375, -2.3153076171875, -2.15509033203125, -1.994873046875, -1.83465576171875, -1.6744384765625, -1.51422119140625, -1.35400390625, -1.19378662109375, -1.0335693359375, -0.87335205078125, -0.713134765625, -0.55291748046875, -0.3927001953125, -0.23248291015625, -0.072265625, 0.08795166015625, 0.2481689453125, 0.40838623046875, 0.568603515625, 0.72882080078125, 0.8890380859375, 1.04925537109375, 1.20947265625, 1.36968994140625, 1.5299072265625, 1.69012451171875, 1.850341796875, 2.01055908203125, 2.1707763671875, 2.33099365234375, 2.4912109375, 2.65142822265625, 2.8116455078125, 2.97186279296875, 3.132080078125, 3.29229736328125, 3.4525146484375, 3.61273193359375, 3.77294921875, 3.93316650390625, 4.0933837890625, 4.25360107421875, 4.413818359375, 4.57403564453125, 4.7342529296875, 4.89447021484375, 5.0546875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 2.0, 7.0, 11.0, 20.0, 24.0, 45.0, 54.0, 89.0, 150.0, 193.0, 308.0, 476.0, 769.0, 1136.0, 1753.0, 2769.0, 4504.0, 6926.0, 11234.0, 19183.0, 32644.0, 57231.0, 98734.0, 160735.0, 1256172.0, 174961.0, 110518.0, 64531.0, 36785.0, 21273.0, 12723.0, 7856.0, 4814.0, 3048.0, 1903.0, 1208.0, 808.0, 537.0, 343.0, 222.0, 154.0, 85.0, 61.0, 38.0, 33.0, 18.0, 20.0, 4.0, 4.0, 5.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.72900390625, -0.7059402465820312, -0.6828765869140625, -0.6598129272460938, -0.636749267578125, -0.6136856079101562, -0.5906219482421875, -0.5675582885742188, -0.54449462890625, -0.5214309692382812, -0.4983673095703125, -0.47530364990234375, -0.452239990234375, -0.42917633056640625, -0.4061126708984375, -0.38304901123046875, -0.3599853515625, -0.33692169189453125, -0.3138580322265625, -0.29079437255859375, -0.267730712890625, -0.24466705322265625, -0.2216033935546875, -0.19853973388671875, -0.17547607421875, -0.15241241455078125, -0.1293487548828125, -0.10628509521484375, -0.083221435546875, -0.06015777587890625, -0.0370941162109375, -0.01403045654296875, 0.009033203125, 0.03209686279296875, 0.0551605224609375, 0.07822418212890625, 0.101287841796875, 0.12435150146484375, 0.1474151611328125, 0.17047882080078125, 0.19354248046875, 0.21660614013671875, 0.2396697998046875, 0.26273345947265625, 0.285797119140625, 0.30886077880859375, 0.3319244384765625, 0.35498809814453125, 0.3780517578125, 0.40111541748046875, 0.4241790771484375, 0.44724273681640625, 0.470306396484375, 0.49337005615234375, 0.5164337158203125, 0.5394973754882812, 0.56256103515625, 0.5856246948242188, 0.6086883544921875, 0.6317520141601562, 0.654815673828125, 0.6778793334960938, 0.7009429931640625, 0.7240066528320312, 0.7470703125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 3.0, 14.0, 14.0, 13.0, 14.0, 19.0, 17.0, 26.0, 26.0, 41.0, 45.0, 52.0, 50.0, 51.0, 49.0, 52.0, 52.0, 56.0, 58.0, 43.0, 38.0, 56.0, 24.0, 24.0, 30.0, 24.0, 18.0, 13.0, 11.0, 12.0, 8.0, 10.0, 4.0, 8.0, 6.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.002063751220703125, -0.0020025670528411865, -0.001941382884979248, -0.0018801987171173096, -0.001819014549255371, -0.0017578303813934326, -0.0016966462135314941, -0.0016354620456695557, -0.0015742778778076172, -0.0015130937099456787, -0.0014519095420837402, -0.0013907253742218018, -0.0013295412063598633, -0.0012683570384979248, -0.0012071728706359863, -0.0011459887027740479, -0.0010848045349121094, -0.001023620367050171, -0.0009624361991882324, -0.0009012520313262939, -0.0008400678634643555, -0.000778883695602417, -0.0007176995277404785, -0.00065651535987854, -0.0005953311920166016, -0.0005341470241546631, -0.0004729628562927246, -0.00041177868843078613, -0.00035059452056884766, -0.0002894103527069092, -0.0002282261848449707, -0.00016704201698303223, -0.00010585784912109375, -4.4673681259155273e-05, 1.6510486602783203e-05, 7.769465446472168e-05, 0.00013887882232666016, 0.00020006299018859863, 0.0002612471580505371, 0.0003224313259124756, 0.00038361549377441406, 0.00044479966163635254, 0.000505983829498291, 0.0005671679973602295, 0.000628352165222168, 0.0006895363330841064, 0.0007507205009460449, 0.0008119046688079834, 0.0008730888366699219, 0.0009342730045318604, 0.0009954571723937988, 0.0010566413402557373, 0.0011178255081176758, 0.0011790096759796143, 0.0012401938438415527, 0.0013013780117034912, 0.0013625621795654297, 0.0014237463474273682, 0.0014849305152893066, 0.0015461146831512451, 0.0016072988510131836, 0.001668483018875122, 0.0017296671867370605, 0.001790851354598999, 0.0018520355224609375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 1.0, 13.0, 10.0, 13.0, 9.0, 13.0, 19.0, 27.0, 32.0, 43.0, 48.0, 58.0, 79.0, 101.0, 164.0, 303.0, 539.0, 1612.0, 781688.0, 261327.0, 1163.0, 466.0, 265.0, 133.0, 83.0, 77.0, 51.0, 39.0, 39.0, 29.0, 22.0, 18.0, 16.0, 14.0, 7.0, 7.0, 8.0, 5.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.040863037109375, -0.039540767669677734, -0.03821849822998047, -0.0368962287902832, -0.03557395935058594, -0.03425168991088867, -0.032929420471191406, -0.03160715103149414, -0.030284881591796875, -0.02896261215209961, -0.027640342712402344, -0.026318073272705078, -0.024995803833007812, -0.023673534393310547, -0.02235126495361328, -0.021028995513916016, -0.01970672607421875, -0.018384456634521484, -0.01706218719482422, -0.015739917755126953, -0.014417648315429688, -0.013095378875732422, -0.011773109436035156, -0.01045083999633789, -0.009128570556640625, -0.007806301116943359, -0.006484031677246094, -0.005161762237548828, -0.0038394927978515625, -0.002517223358154297, -0.0011949539184570312, 0.00012731552124023438, 0.0014495849609375, 0.0027718544006347656, 0.004094123840332031, 0.005416393280029297, 0.0067386627197265625, 0.008060932159423828, 0.009383201599121094, 0.01070547103881836, 0.012027740478515625, 0.01335000991821289, 0.014672279357910156, 0.015994548797607422, 0.017316818237304688, 0.018639087677001953, 0.01996135711669922, 0.021283626556396484, 0.02260589599609375, 0.023928165435791016, 0.02525043487548828, 0.026572704315185547, 0.027894973754882812, 0.029217243194580078, 0.030539512634277344, 0.03186178207397461, 0.033184051513671875, 0.03450632095336914, 0.035828590393066406, 0.03715085983276367, 0.03847312927246094, 0.0397953987121582, 0.04111766815185547, 0.042439937591552734, 0.04376220703125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 13.0, 64.0, 263.0, 415.0, 198.0, 52.0, 9.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005845477804541588, -0.005707615055143833, -0.005569752771407366, -0.005431890022009611, -0.005294027738273144, -0.005156164988875389, -0.005018302705138922, -0.004880439955741167, -0.0047425776720047, -0.004604714922606945, -0.004466852638870478, -0.004328989889472723, -0.004191127605736256, -0.004053264856338501, -0.003915402572602034, -0.003777539823204279, -0.0036396770738065243, -0.0035018145572394133, -0.0033639520406723022, -0.0032260895241051912, -0.00308822700753808, -0.0029503642581403255, -0.0028125017415732145, -0.0026746392250061035, -0.0025367767084389925, -0.0023989141918718815, -0.0022610516753047705, -0.0021231891587376595, -0.001985326409339905, -0.0018474640091881156, -0.0017096013762056828, -0.0015717388596385717, -0.001433876808732748, -0.001296014292165637, -0.001158151775598526, -0.0010202891426160932, -0.0008824266260489821, -0.0007445641094818711, -0.0006067015347070992, -0.00046883895993232727, -0.00033097644336521626, -0.00019311389769427478, -5.525135202333331e-05, 8.261119364760816e-05, 0.00022047373931854963, 0.00035833625588566065, 0.0004961988306604326, 0.0006340614054352045, 0.0007719239220023155, 0.0009097864385694265, 0.0010476489551365376, 0.0011855115881189704, 0.0013233741046860814, 0.0014612366212531924, 0.0015990992542356253, 0.0017369617708027363, 0.0018748242873698473, 0.0020126868039369583, 0.0021505493205040693, 0.0022884118370711803, 0.002426274586468935, 0.0025641368702054024, 0.002701999619603157, 0.002839862136170268, 0.002977724652737379]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 2.0, 2.0, 8.0, 4.0, 13.0, 11.0, 14.0, 13.0, 18.0, 11.0, 25.0, 24.0, 29.0, 27.0, 30.0, 27.0, 38.0, 37.0, 36.0, 36.0, 36.0, 41.0, 50.0, 43.0, 39.0, 44.0, 34.0, 37.0, 24.0, 24.0, 25.0, 33.0, 26.0, 20.0, 25.0, 22.0, 17.0, 13.0, 14.0, 5.0, 7.0, 11.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001056075096130371, -0.0010235235095024109, -0.0009909719228744507, -0.0009584203362464905, -0.0009258687496185303, -0.0008933171629905701, -0.0008607655763626099, -0.0008282139897346497, -0.0007956624031066895, -0.0007631108164787292, -0.000730559229850769, -0.0006980076432228088, -0.0006654560565948486, -0.0006329044699668884, -0.0006003528833389282, -0.000567801296710968, -0.0005352497100830078, -0.0005026981234550476, -0.0004701465368270874, -0.0004375949501991272, -0.000405043363571167, -0.0003724917769432068, -0.0003399401903152466, -0.0003073886036872864, -0.00027483701705932617, -0.00024228543043136597, -0.00020973384380340576, -0.00017718225717544556, -0.00014463067054748535, -0.00011207908391952515, -7.952749729156494e-05, -4.6975910663604736e-05, -1.4424324035644531e-05, 1.8127262592315674e-05, 5.067884922027588e-05, 8.323043584823608e-05, 0.00011578202247619629, 0.0001483336091041565, 0.0001808851957321167, 0.0002134367823600769, 0.0002459883689880371, 0.0002785399556159973, 0.0003110915422439575, 0.0003436431288719177, 0.00037619471549987793, 0.00040874630212783813, 0.00044129788875579834, 0.00047384947538375854, 0.0005064010620117188, 0.000538952648639679, 0.0005715042352676392, 0.0006040558218955994, 0.0006366074085235596, 0.0006691589951515198, 0.00070171058177948, 0.0007342621684074402, 0.0007668137550354004, 0.0007993653416633606, 0.0008319169282913208, 0.000864468514919281, 0.0008970201015472412, 0.0009295716881752014, 0.0009621232748031616, 0.0009946748614311218, 0.001027226448059082]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 2.0, 4.0, 2.0, 3.0, 7.0, 8.0, 11.0, 6.0, 11.0, 9.0, 17.0, 20.0, 17.0, 15.0, 26.0, 23.0, 23.0, 18.0, 23.0, 32.0, 29.0, 36.0, 27.0, 43.0, 32.0, 33.0, 51.0, 31.0, 46.0, 41.0, 33.0, 40.0, 42.0, 30.0, 24.0, 22.0, 14.0, 22.0, 22.0, 22.0, 16.0, 11.0, 10.0, 13.0, 9.0, 6.0, 5.0, 1.0, 4.0, 4.0, 2.0, 5.0, 2.0, 3.0], "bins": [-7.6171875, -7.40386962890625, -7.1905517578125, -6.97723388671875, -6.763916015625, -6.55059814453125, -6.3372802734375, -6.12396240234375, -5.91064453125, -5.69732666015625, -5.4840087890625, -5.27069091796875, -5.057373046875, -4.84405517578125, -4.6307373046875, -4.41741943359375, -4.2041015625, -3.99078369140625, -3.7774658203125, -3.56414794921875, -3.350830078125, -3.13751220703125, -2.9241943359375, -2.71087646484375, -2.49755859375, -2.28424072265625, -2.0709228515625, -1.85760498046875, -1.644287109375, -1.43096923828125, -1.2176513671875, -1.00433349609375, -0.791015625, -0.57769775390625, -0.3643798828125, -0.15106201171875, 0.062255859375, 0.27557373046875, 0.4888916015625, 0.70220947265625, 0.91552734375, 1.12884521484375, 1.3421630859375, 1.55548095703125, 1.768798828125, 1.98211669921875, 2.1954345703125, 2.40875244140625, 2.6220703125, 2.83538818359375, 3.0487060546875, 3.26202392578125, 3.475341796875, 3.68865966796875, 3.9019775390625, 4.11529541015625, 4.32861328125, 4.54193115234375, 4.7552490234375, 4.96856689453125, 5.181884765625, 5.39520263671875, 5.6085205078125, 5.82183837890625, 6.03515625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 1.0, 9.0, 8.0, 12.0, 10.0, 11.0, 19.0, 28.0, 17.0, 42.0, 46.0, 56.0, 71.0, 103.0, 115.0, 166.0, 253.0, 437.0, 877.0, 2908.0, 13072.0, 82126.0, 709420.0, 205612.0, 24882.0, 5175.0, 1384.0, 550.0, 317.0, 198.0, 160.0, 104.0, 61.0, 51.0, 55.0, 44.0, 37.0, 17.0, 17.0, 13.0, 18.0, 10.0, 7.0, 7.0, 2.0, 6.0, 6.0, 0.0, 6.0, 3.0, 2.0], "bins": [-15.171875, -14.746826171875, -14.32177734375, -13.896728515625, -13.4716796875, -13.046630859375, -12.62158203125, -12.196533203125, -11.771484375, -11.346435546875, -10.92138671875, -10.496337890625, -10.0712890625, -9.646240234375, -9.22119140625, -8.796142578125, -8.37109375, -7.946044921875, -7.52099609375, -7.095947265625, -6.6708984375, -6.245849609375, -5.82080078125, -5.395751953125, -4.970703125, -4.545654296875, -4.12060546875, -3.695556640625, -3.2705078125, -2.845458984375, -2.42041015625, -1.995361328125, -1.5703125, -1.145263671875, -0.72021484375, -0.295166015625, 0.1298828125, 0.554931640625, 0.97998046875, 1.405029296875, 1.830078125, 2.255126953125, 2.68017578125, 3.105224609375, 3.5302734375, 3.955322265625, 4.38037109375, 4.805419921875, 5.23046875, 5.655517578125, 6.08056640625, 6.505615234375, 6.9306640625, 7.355712890625, 7.78076171875, 8.205810546875, 8.630859375, 9.055908203125, 9.48095703125, 9.906005859375, 10.3310546875, 10.756103515625, 11.18115234375, 11.606201171875, 12.03125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 0.0, 0.0, 4.0, 5.0, 3.0, 4.0, 7.0, 8.0, 5.0, 10.0, 10.0, 12.0, 17.0, 23.0, 29.0, 30.0, 32.0, 26.0, 37.0, 44.0, 35.0, 44.0, 66.0, 113.0, 296.0, 1552.0, 147.0, 69.0, 58.0, 44.0, 32.0, 38.0, 29.0, 29.0, 39.0, 28.0, 22.0, 21.0, 15.0, 13.0, 17.0, 3.0, 8.0, 10.0, 7.0, 3.0, 0.0, 2.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-23.4375, -22.751708984375, -22.06591796875, -21.380126953125, -20.6943359375, -20.008544921875, -19.32275390625, -18.636962890625, -17.951171875, -17.265380859375, -16.57958984375, -15.893798828125, -15.2080078125, -14.522216796875, -13.83642578125, -13.150634765625, -12.46484375, -11.779052734375, -11.09326171875, -10.407470703125, -9.7216796875, -9.035888671875, -8.35009765625, -7.664306640625, -6.978515625, -6.292724609375, -5.60693359375, -4.921142578125, -4.2353515625, -3.549560546875, -2.86376953125, -2.177978515625, -1.4921875, -0.806396484375, -0.12060546875, 0.565185546875, 1.2509765625, 1.936767578125, 2.62255859375, 3.308349609375, 3.994140625, 4.679931640625, 5.36572265625, 6.051513671875, 6.7373046875, 7.423095703125, 8.10888671875, 8.794677734375, 9.48046875, 10.166259765625, 10.85205078125, 11.537841796875, 12.2236328125, 12.909423828125, 13.59521484375, 14.281005859375, 14.966796875, 15.652587890625, 16.33837890625, 17.024169921875, 17.7099609375, 18.395751953125, 19.08154296875, 19.767333984375, 20.453125]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 2.0, 0.0, 3.0, 8.0, 3.0, 11.0, 10.0, 12.0, 18.0, 22.0, 27.0, 28.0, 37.0, 44.0, 48.0, 58.0, 89.0, 122.0, 211.0, 369.0, 858.0, 6261.0, 2988021.0, 145695.0, 2254.0, 578.0, 270.0, 173.0, 124.0, 63.0, 49.0, 51.0, 47.0, 30.0, 20.0, 12.0, 19.0, 10.0, 13.0, 7.0, 8.0, 4.0, 7.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.5, -45.90625, -44.3125, -42.71875, -41.125, -39.53125, -37.9375, -36.34375, -34.75, -33.15625, -31.5625, -29.96875, -28.375, -26.78125, -25.1875, -23.59375, -22.0, -20.40625, -18.8125, -17.21875, -15.625, -14.03125, -12.4375, -10.84375, -9.25, -7.65625, -6.0625, -4.46875, -2.875, -1.28125, 0.3125, 1.90625, 3.5, 5.09375, 6.6875, 8.28125, 9.875, 11.46875, 13.0625, 14.65625, 16.25, 17.84375, 19.4375, 21.03125, 22.625, 24.21875, 25.8125, 27.40625, 29.0, 30.59375, 32.1875, 33.78125, 35.375, 36.96875, 38.5625, 40.15625, 41.75, 43.34375, 44.9375, 46.53125, 48.125, 49.71875, 51.3125, 52.90625, 54.5]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 271.0, 690.0, 48.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.13741302490234, -67.41154479980469, -62.68567657470703, -57.95980453491211, -53.23393630981445, -48.5080680847168, -43.782196044921875, -39.05632781982422, -34.33045959472656, -29.604591369628906, -24.878721237182617, -20.152851104736328, -15.426982879638672, -10.701114654541016, -5.975244522094727, -1.2493743896484375, 3.4764938354492188, 8.202363014221191, 12.928232192993164, 17.654102325439453, 22.37997055053711, 27.105838775634766, 31.831708908081055, 36.557579040527344, 41.283447265625, 46.009315490722656, 50.73518371582031, 55.461055755615234, 60.18692398071289, 64.91279602050781, 69.63866424560547, 74.36453247070312, 79.09040832519531, 83.81627655029297, 88.54214477539062, 93.26801300048828, 97.99388122558594, 102.71975708007812, 107.44562530517578, 112.17149353027344, 116.8973617553711, 121.62322998046875, 126.3490982055664, 131.07496643066406, 135.80084228515625, 140.52670288085938, 145.25257873535156, 149.97845458984375, 154.70431518554688, 159.43019104003906, 164.1560516357422, 168.88192749023438, 173.6077880859375, 178.3336639404297, 183.0595245361328, 187.785400390625, 192.51126098632812, 197.2371368408203, 201.96299743652344, 206.68887329101562, 211.41473388671875, 216.14060974121094, 220.86647033691406, 225.59234619140625, 230.31822204589844]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 5.0, 7.0, 8.0, 9.0, 12.0, 8.0, 11.0, 17.0, 17.0, 25.0, 26.0, 30.0, 26.0, 37.0, 38.0, 34.0, 34.0, 42.0, 37.0, 38.0, 41.0, 41.0, 46.0, 48.0, 44.0, 39.0, 49.0, 31.0, 29.0, 27.0, 25.0, 18.0, 23.0, 12.0, 14.0, 8.0, 15.0, 8.0, 5.0, 4.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-60.92143249511719, -58.97035598754883, -57.01927947998047, -55.06820297241211, -53.11712646484375, -51.16604995727539, -49.21497344970703, -47.26389694213867, -45.31282043457031, -43.36174392700195, -41.410667419433594, -39.459590911865234, -37.508514404296875, -35.557437896728516, -33.606361389160156, -31.655284881591797, -29.704206466674805, -27.753129959106445, -25.802053451538086, -23.850976943969727, -21.899900436401367, -19.948822021484375, -17.997745513916016, -16.046669006347656, -14.095593452453613, -12.144516944885254, -10.193440437316895, -8.242362976074219, -6.291286945343018, -4.3402099609375, -2.3891334533691406, -0.43805694580078125, 1.5130195617675781, 3.4640960693359375, 5.415172576904297, 7.3662495613098145, 9.317325592041016, 11.268403053283691, 13.21947956085205, 15.17055606842041, 17.121631622314453, 19.072708129882812, 21.023784637451172, 22.97486114501953, 24.92593765258789, 26.87701416015625, 28.82809066772461, 30.77916717529297, 32.730247497558594, 34.68132400512695, 36.63240051269531, 38.58347702026367, 40.53455352783203, 42.48563003540039, 44.43670654296875, 46.38778305053711, 48.33885955810547, 50.28993606567383, 52.24101257324219, 54.19208908081055, 56.143165588378906, 58.094242095947266, 60.045318603515625, 61.996395111083984, 63.947471618652344]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0, 4.0, 4.0, 1.0, 2.0, 11.0, 4.0, 8.0, 10.0, 11.0, 13.0, 14.0, 24.0, 18.0, 20.0, 20.0, 22.0, 19.0, 20.0, 30.0, 36.0, 40.0, 37.0, 25.0, 35.0, 31.0, 36.0, 54.0, 43.0, 54.0, 36.0, 36.0, 49.0, 23.0, 31.0, 16.0, 30.0, 19.0, 21.0, 14.0, 11.0, 14.0, 10.0, 8.0, 14.0, 7.0, 3.0, 7.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-7.85546875, -7.62542724609375, -7.3953857421875, -7.16534423828125, -6.935302734375, -6.70526123046875, -6.4752197265625, -6.24517822265625, -6.01513671875, -5.78509521484375, -5.5550537109375, -5.32501220703125, -5.094970703125, -4.86492919921875, -4.6348876953125, -4.40484619140625, -4.1748046875, -3.94476318359375, -3.7147216796875, -3.48468017578125, -3.254638671875, -3.02459716796875, -2.7945556640625, -2.56451416015625, -2.33447265625, -2.10443115234375, -1.8743896484375, -1.64434814453125, -1.414306640625, -1.18426513671875, -0.9542236328125, -0.72418212890625, -0.494140625, -0.26409912109375, -0.0340576171875, 0.19598388671875, 0.426025390625, 0.65606689453125, 0.8861083984375, 1.11614990234375, 1.34619140625, 1.57623291015625, 1.8062744140625, 2.03631591796875, 2.266357421875, 2.49639892578125, 2.7264404296875, 2.95648193359375, 3.1865234375, 3.41656494140625, 3.6466064453125, 3.87664794921875, 4.106689453125, 4.33673095703125, 4.5667724609375, 4.79681396484375, 5.02685546875, 5.25689697265625, 5.4869384765625, 5.71697998046875, 5.947021484375, 6.17706298828125, 6.4071044921875, 6.63714599609375, 6.8671875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 5.0, 0.0, 5.0, 2.0, 4.0, 4.0, 7.0, 15.0, 16.0, 16.0, 16.0, 15.0, 24.0, 25.0, 26.0, 41.0, 64.0, 96.0, 158.0, 300.0, 615.0, 1465.0, 4843.0, 23388.0, 307826.0, 2744556.0, 1036356.0, 61740.0, 8532.0, 2284.0, 834.0, 387.0, 177.0, 134.0, 94.0, 47.0, 32.0, 23.0, 21.0, 22.0, 13.0, 9.0, 5.0, 13.0, 9.0, 8.0, 9.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-20.5, -19.909423828125, -19.31884765625, -18.728271484375, -18.1376953125, -17.547119140625, -16.95654296875, -16.365966796875, -15.775390625, -15.184814453125, -14.59423828125, -14.003662109375, -13.4130859375, -12.822509765625, -12.23193359375, -11.641357421875, -11.05078125, -10.460205078125, -9.86962890625, -9.279052734375, -8.6884765625, -8.097900390625, -7.50732421875, -6.916748046875, -6.326171875, -5.735595703125, -5.14501953125, -4.554443359375, -3.9638671875, -3.373291015625, -2.78271484375, -2.192138671875, -1.6015625, -1.010986328125, -0.42041015625, 0.170166015625, 0.7607421875, 1.351318359375, 1.94189453125, 2.532470703125, 3.123046875, 3.713623046875, 4.30419921875, 4.894775390625, 5.4853515625, 6.075927734375, 6.66650390625, 7.257080078125, 7.84765625, 8.438232421875, 9.02880859375, 9.619384765625, 10.2099609375, 10.800537109375, 11.39111328125, 11.981689453125, 12.572265625, 13.162841796875, 13.75341796875, 14.343994140625, 14.9345703125, 15.525146484375, 16.11572265625, 16.706298828125, 17.296875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 8.0, 6.0, 11.0, 19.0, 23.0, 37.0, 39.0, 57.0, 55.0, 83.0, 107.0, 175.0, 215.0, 282.0, 384.0, 439.0, 454.0, 426.0, 338.0, 244.0, 158.0, 132.0, 93.0, 65.0, 56.0, 45.0, 39.0, 23.0, 16.0, 16.0, 6.0, 2.0, 6.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.078125, -12.68359375, -12.2890625, -11.89453125, -11.5, -11.10546875, -10.7109375, -10.31640625, -9.921875, -9.52734375, -9.1328125, -8.73828125, -8.34375, -7.94921875, -7.5546875, -7.16015625, -6.765625, -6.37109375, -5.9765625, -5.58203125, -5.1875, -4.79296875, -4.3984375, -4.00390625, -3.609375, -3.21484375, -2.8203125, -2.42578125, -2.03125, -1.63671875, -1.2421875, -0.84765625, -0.453125, -0.05859375, 0.3359375, 0.73046875, 1.125, 1.51953125, 1.9140625, 2.30859375, 2.703125, 3.09765625, 3.4921875, 3.88671875, 4.28125, 4.67578125, 5.0703125, 5.46484375, 5.859375, 6.25390625, 6.6484375, 7.04296875, 7.4375, 7.83203125, 8.2265625, 8.62109375, 9.015625, 9.41015625, 9.8046875, 10.19921875, 10.59375, 10.98828125, 11.3828125, 11.77734375, 12.171875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 3.0, 7.0, 10.0, 10.0, 10.0, 19.0, 15.0, 24.0, 39.0, 61.0, 75.0, 100.0, 127.0, 175.0, 236.0, 417.0, 1001.0, 4263.0, 63844.0, 3579423.0, 527272.0, 13555.0, 1809.0, 640.0, 344.0, 178.0, 150.0, 109.0, 85.0, 69.0, 50.0, 34.0, 29.0, 28.0, 17.0, 10.0, 13.0, 8.0, 10.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-49.6875, -48.33544921875, -46.9833984375, -45.63134765625, -44.279296875, -42.92724609375, -41.5751953125, -40.22314453125, -38.87109375, -37.51904296875, -36.1669921875, -34.81494140625, -33.462890625, -32.11083984375, -30.7587890625, -29.40673828125, -28.0546875, -26.70263671875, -25.3505859375, -23.99853515625, -22.646484375, -21.29443359375, -19.9423828125, -18.59033203125, -17.23828125, -15.88623046875, -14.5341796875, -13.18212890625, -11.830078125, -10.47802734375, -9.1259765625, -7.77392578125, -6.421875, -5.06982421875, -3.7177734375, -2.36572265625, -1.013671875, 0.33837890625, 1.6904296875, 3.04248046875, 4.39453125, 5.74658203125, 7.0986328125, 8.45068359375, 9.802734375, 11.15478515625, 12.5068359375, 13.85888671875, 15.2109375, 16.56298828125, 17.9150390625, 19.26708984375, 20.619140625, 21.97119140625, 23.3232421875, 24.67529296875, 26.02734375, 27.37939453125, 28.7314453125, 30.08349609375, 31.435546875, 32.78759765625, 34.1396484375, 35.49169921875, 36.84375]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 29.0, 116.0, 340.0, 352.0, 143.0, 30.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-265.91778564453125, -260.6051025390625, -255.2924346923828, -249.97975158691406, -244.6670684814453, -239.35440063476562, -234.04171752929688, -228.72903442382812, -223.41635131835938, -218.10366821289062, -212.79100036621094, -207.4783172607422, -202.16563415527344, -196.85296630859375, -191.540283203125, -186.22760009765625, -180.91493225097656, -175.6022491455078, -170.28958129882812, -164.97689819335938, -159.66421508789062, -154.35153198242188, -149.0388641357422, -143.72618103027344, -138.41351318359375, -133.100830078125, -127.78815460205078, -122.47547912597656, -117.16279602050781, -111.8501205444336, -106.53744506835938, -101.22476196289062, -95.9120864868164, -90.59941101074219, -85.28672790527344, -79.97405242919922, -74.661376953125, -69.34869384765625, -64.03601837158203, -58.72333908081055, -53.41065979003906, -48.09798049926758, -42.785301208496094, -37.472625732421875, -32.15994644165039, -26.847267150878906, -21.534589767456055, -16.221912384033203, -10.909233093261719, -5.596554756164551, -0.2838764190673828, 5.028801918029785, 10.341480255126953, 15.654159545898438, 20.96683692932129, 26.27951431274414, 31.592193603515625, 36.90487289428711, 42.217552185058594, 47.53022766113281, 52.8429069519043, 58.15558624267578, 63.46826171875, 68.78094482421875, 74.09362030029297]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 5.0, 1.0, 4.0, 3.0, 3.0, 5.0, 7.0, 8.0, 14.0, 12.0, 9.0, 18.0, 19.0, 17.0, 29.0, 28.0, 32.0, 22.0, 31.0, 32.0, 33.0, 42.0, 42.0, 44.0, 45.0, 43.0, 29.0, 36.0, 46.0, 32.0, 36.0, 35.0, 26.0, 31.0, 29.0, 27.0, 21.0, 21.0, 12.0, 16.0, 10.0, 8.0, 8.0, 8.0, 4.0, 6.0, 6.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-43.677459716796875, -42.42430114746094, -41.171138763427734, -39.9179801940918, -38.664817810058594, -37.411659240722656, -36.15850067138672, -34.90534210205078, -33.65217971801758, -32.39902114868164, -31.145858764648438, -29.8927001953125, -28.63953971862793, -27.38637924194336, -26.133220672607422, -24.88006019592285, -23.62689971923828, -22.37373924255371, -21.12057876586914, -19.867420196533203, -18.614259719848633, -17.361099243164062, -16.107940673828125, -14.854780197143555, -13.601619720458984, -12.348459243774414, -11.09529972076416, -9.842140197753906, -8.588979721069336, -7.335819721221924, -6.082659721374512, -4.829500198364258, -3.5763397216796875, -2.3231797218322754, -1.0700197219848633, 0.18314027786254883, 1.436300277709961, 2.689460277557373, 3.942620277404785, 5.195779800415039, 6.448940277099609, 7.7021002769470215, 8.955260276794434, 10.208419799804688, 11.461580276489258, 12.714740753173828, 13.967900276184082, 15.221059799194336, 16.474220275878906, 17.727380752563477, 18.980541229248047, 20.233699798583984, 21.486860275268555, 22.740020751953125, 23.993179321289062, 25.246339797973633, 26.499500274658203, 27.752660751342773, 29.005821228027344, 30.25897979736328, 31.51214027404785, 32.76530075073242, 34.01845932006836, 35.27162170410156, 36.5247802734375]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 4.0, 4.0, 4.0, 7.0, 9.0, 10.0, 8.0, 18.0, 13.0, 16.0, 15.0, 32.0, 22.0, 25.0, 30.0, 27.0, 33.0, 40.0, 34.0, 32.0, 40.0, 47.0, 48.0, 44.0, 52.0, 37.0, 43.0, 40.0, 30.0, 34.0, 30.0, 20.0, 35.0, 18.0, 21.0, 11.0, 11.0, 16.0, 5.0, 7.0, 8.0, 6.0, 4.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7734375, -8.51605224609375, -8.2586669921875, -8.00128173828125, -7.743896484375, -7.48651123046875, -7.2291259765625, -6.97174072265625, -6.71435546875, -6.45697021484375, -6.1995849609375, -5.94219970703125, -5.684814453125, -5.42742919921875, -5.1700439453125, -4.91265869140625, -4.6552734375, -4.39788818359375, -4.1405029296875, -3.88311767578125, -3.625732421875, -3.36834716796875, -3.1109619140625, -2.85357666015625, -2.59619140625, -2.33880615234375, -2.0814208984375, -1.82403564453125, -1.566650390625, -1.30926513671875, -1.0518798828125, -0.79449462890625, -0.537109375, -0.27972412109375, -0.0223388671875, 0.23504638671875, 0.492431640625, 0.74981689453125, 1.0072021484375, 1.26458740234375, 1.52197265625, 1.77935791015625, 2.0367431640625, 2.29412841796875, 2.551513671875, 2.80889892578125, 3.0662841796875, 3.32366943359375, 3.5810546875, 3.83843994140625, 4.0958251953125, 4.35321044921875, 4.610595703125, 4.86798095703125, 5.1253662109375, 5.38275146484375, 5.64013671875, 5.89752197265625, 6.1549072265625, 6.41229248046875, 6.669677734375, 6.92706298828125, 7.1844482421875, 7.44183349609375, 7.69921875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 8.0, 2.0, 4.0, 13.0, 13.0, 29.0, 25.0, 54.0, 82.0, 131.0, 185.0, 285.0, 445.0, 732.0, 1201.0, 2027.0, 3392.0, 5600.0, 9266.0, 15826.0, 27795.0, 48620.0, 87208.0, 154928.0, 227051.0, 195104.0, 117077.0, 64427.0, 35963.0, 20719.0, 12274.0, 7191.0, 4169.0, 2601.0, 1531.0, 980.0, 571.0, 374.0, 243.0, 142.0, 94.0, 75.0, 37.0, 22.0, 12.0, 16.0, 8.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.87646484375, -0.8488540649414062, -0.8212432861328125, -0.7936325073242188, -0.766021728515625, -0.7384109497070312, -0.7108001708984375, -0.6831893920898438, -0.65557861328125, -0.6279678344726562, -0.6003570556640625, -0.5727462768554688, -0.545135498046875, -0.5175247192382812, -0.4899139404296875, -0.46230316162109375, -0.4346923828125, -0.40708160400390625, -0.3794708251953125, -0.35186004638671875, -0.324249267578125, -0.29663848876953125, -0.2690277099609375, -0.24141693115234375, -0.21380615234375, -0.18619537353515625, -0.1585845947265625, -0.13097381591796875, -0.103363037109375, -0.07575225830078125, -0.0481414794921875, -0.02053070068359375, 0.007080078125, 0.03469085693359375, 0.0623016357421875, 0.08991241455078125, 0.117523193359375, 0.14513397216796875, 0.1727447509765625, 0.20035552978515625, 0.22796630859375, 0.25557708740234375, 0.2831878662109375, 0.31079864501953125, 0.338409423828125, 0.36602020263671875, 0.3936309814453125, 0.42124176025390625, 0.4488525390625, 0.47646331787109375, 0.5040740966796875, 0.5316848754882812, 0.559295654296875, 0.5869064331054688, 0.6145172119140625, 0.6421279907226562, 0.66973876953125, 0.6973495483398438, 0.7249603271484375, 0.7525711059570312, 0.780181884765625, 0.8077926635742188, 0.8354034423828125, 0.8630142211914062, 0.890625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 5.0, 5.0, 5.0, 9.0, 17.0, 10.0, 14.0, 19.0, 23.0, 22.0, 25.0, 23.0, 26.0, 32.0, 32.0, 42.0, 41.0, 29.0, 27.0, 44.0, 1068.0, 39.0, 40.0, 47.0, 39.0, 47.0, 40.0, 25.0, 28.0, 35.0, 30.0, 22.0, 13.0, 13.0, 15.0, 15.0, 15.0, 10.0, 8.0, 6.0, 3.0, 7.0, 4.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.765625, -4.60406494140625, -4.4425048828125, -4.28094482421875, -4.119384765625, -3.95782470703125, -3.7962646484375, -3.63470458984375, -3.47314453125, -3.31158447265625, -3.1500244140625, -2.98846435546875, -2.826904296875, -2.66534423828125, -2.5037841796875, -2.34222412109375, -2.1806640625, -2.01910400390625, -1.8575439453125, -1.69598388671875, -1.534423828125, -1.37286376953125, -1.2113037109375, -1.04974365234375, -0.88818359375, -0.72662353515625, -0.5650634765625, -0.40350341796875, -0.241943359375, -0.08038330078125, 0.0811767578125, 0.24273681640625, 0.404296875, 0.56585693359375, 0.7274169921875, 0.88897705078125, 1.050537109375, 1.21209716796875, 1.3736572265625, 1.53521728515625, 1.69677734375, 1.85833740234375, 2.0198974609375, 2.18145751953125, 2.343017578125, 2.50457763671875, 2.6661376953125, 2.82769775390625, 2.9892578125, 3.15081787109375, 3.3123779296875, 3.47393798828125, 3.635498046875, 3.79705810546875, 3.9586181640625, 4.12017822265625, 4.28173828125, 4.44329833984375, 4.6048583984375, 4.76641845703125, 4.927978515625, 5.08953857421875, 5.2510986328125, 5.41265869140625, 5.57421875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 9.0, 23.0, 27.0, 28.0, 59.0, 63.0, 107.0, 191.0, 296.0, 460.0, 741.0, 1285.0, 2120.0, 3518.0, 6000.0, 10191.0, 17217.0, 30297.0, 53042.0, 94900.0, 160880.0, 1265009.0, 184787.0, 114430.0, 64329.0, 36296.0, 20844.0, 12207.0, 6986.0, 4257.0, 2639.0, 1439.0, 941.0, 585.0, 366.0, 190.0, 122.0, 97.0, 59.0, 30.0, 17.0, 12.0, 10.0, 8.0, 6.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.716796875, -0.6917953491210938, -0.6667938232421875, -0.6417922973632812, -0.616790771484375, -0.5917892456054688, -0.5667877197265625, -0.5417861938476562, -0.51678466796875, -0.49178314208984375, -0.4667816162109375, -0.44178009033203125, -0.416778564453125, -0.39177703857421875, -0.3667755126953125, -0.34177398681640625, -0.3167724609375, -0.29177093505859375, -0.2667694091796875, -0.24176788330078125, -0.216766357421875, -0.19176483154296875, -0.1667633056640625, -0.14176177978515625, -0.11676025390625, -0.09175872802734375, -0.0667572021484375, -0.04175567626953125, -0.016754150390625, 0.00824737548828125, 0.0332489013671875, 0.05825042724609375, 0.083251953125, 0.10825347900390625, 0.1332550048828125, 0.15825653076171875, 0.183258056640625, 0.20825958251953125, 0.2332611083984375, 0.25826263427734375, 0.28326416015625, 0.30826568603515625, 0.3332672119140625, 0.35826873779296875, 0.383270263671875, 0.40827178955078125, 0.4332733154296875, 0.45827484130859375, 0.4832763671875, 0.5082778930664062, 0.5332794189453125, 0.5582809448242188, 0.583282470703125, 0.6082839965820312, 0.6332855224609375, 0.6582870483398438, 0.68328857421875, 0.7082901000976562, 0.7332916259765625, 0.7582931518554688, 0.783294677734375, 0.8082962036132812, 0.8332977294921875, 0.8582992553710938, 0.88330078125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 6.0, 2.0, 5.0, 7.0, 10.0, 10.0, 12.0, 19.0, 17.0, 15.0, 31.0, 34.0, 29.0, 44.0, 48.0, 49.0, 63.0, 49.0, 44.0, 49.0, 47.0, 57.0, 57.0, 52.0, 48.0, 30.0, 35.0, 27.0, 22.0, 25.0, 10.0, 15.0, 2.0, 13.0, 7.0, 7.0, 8.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018968582153320312, -0.0018270164728164673, -0.0017571747303009033, -0.0016873329877853394, -0.0016174912452697754, -0.0015476495027542114, -0.0014778077602386475, -0.0014079660177230835, -0.0013381242752075195, -0.0012682825326919556, -0.0011984407901763916, -0.0011285990476608276, -0.0010587573051452637, -0.0009889155626296997, -0.0009190738201141357, -0.0008492320775985718, -0.0007793903350830078, -0.0007095485925674438, -0.0006397068500518799, -0.0005698651075363159, -0.000500023365020752, -0.000430181622505188, -0.000360339879989624, -0.00029049813747406006, -0.0002206563949584961, -0.00015081465244293213, -8.097290992736816e-05, -1.11311674118042e-05, 5.8710575103759766e-05, 0.00012855231761932373, 0.0001983940601348877, 0.00026823580265045166, 0.0003380775451660156, 0.0004079192876815796, 0.00047776103019714355, 0.0005476027727127075, 0.0006174445152282715, 0.0006872862577438354, 0.0007571280002593994, 0.0008269697427749634, 0.0008968114852905273, 0.0009666532278060913, 0.0010364949703216553, 0.0011063367128372192, 0.0011761784553527832, 0.0012460201978683472, 0.0013158619403839111, 0.001385703682899475, 0.001455545425415039, 0.001525387167930603, 0.001595228910446167, 0.001665070652961731, 0.001734912395477295, 0.0018047541379928589, 0.0018745958805084229, 0.0019444376230239868, 0.0020142793655395508, 0.0020841211080551147, 0.0021539628505706787, 0.0022238045930862427, 0.0022936463356018066, 0.0023634880781173706, 0.0024333298206329346, 0.0025031715631484985, 0.0025730133056640625]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 1.0, 9.0, 11.0, 11.0, 9.0, 22.0, 23.0, 33.0, 35.0, 54.0, 53.0, 70.0, 102.0, 138.0, 188.0, 356.0, 739.0, 4149.0, 1016141.0, 24199.0, 887.0, 416.0, 248.0, 172.0, 113.0, 73.0, 62.0, 48.0, 41.0, 30.0, 31.0, 22.0, 14.0, 11.0, 15.0, 3.0, 11.0, 2.0, 2.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.048736572265625, -0.04736900329589844, -0.046001434326171875, -0.04463386535644531, -0.04326629638671875, -0.04189872741699219, -0.040531158447265625, -0.03916358947753906, -0.0377960205078125, -0.03642845153808594, -0.035060882568359375, -0.03369331359863281, -0.03232574462890625, -0.030958175659179688, -0.029590606689453125, -0.028223037719726562, -0.02685546875, -0.025487899780273438, -0.024120330810546875, -0.022752761840820312, -0.02138519287109375, -0.020017623901367188, -0.018650054931640625, -0.017282485961914062, -0.0159149169921875, -0.014547348022460938, -0.013179779052734375, -0.011812210083007812, -0.01044464111328125, -0.009077072143554688, -0.007709503173828125, -0.0063419342041015625, -0.004974365234375, -0.0036067962646484375, -0.002239227294921875, -0.0008716583251953125, 0.00049591064453125, 0.0018634796142578125, 0.003231048583984375, 0.0045986175537109375, 0.0059661865234375, 0.0073337554931640625, 0.008701324462890625, 0.010068893432617188, 0.01143646240234375, 0.012804031372070312, 0.014171600341796875, 0.015539169311523438, 0.01690673828125, 0.018274307250976562, 0.019641876220703125, 0.021009445190429688, 0.02237701416015625, 0.023744583129882812, 0.025112152099609375, 0.026479721069335938, 0.0278472900390625, 0.029214859008789062, 0.030582427978515625, 0.03194999694824219, 0.03331756591796875, 0.03468513488769531, 0.036052703857421875, 0.03742027282714844, 0.038787841796875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [20.0, 516.0, 459.0, 22.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006244506221264601, -0.0003027369675692171, 1.8976686988025904e-05, 0.00034069037064909935, 0.0006624039961025119, 0.0009841176215559244, 0.0013058313634246588, 0.0016275448724627495, 0.0019492586143314838, 0.002270972356200218, 0.002592685865238309, 0.0029143996071070433, 0.003236113116145134, 0.0035578268580138683, 0.0038795405998826027, 0.00420125387609005, 0.004522968083620071, 0.004844681825488806, 0.00516639556735754, 0.005488108843564987, 0.0058098225854337215, 0.006131536327302456, 0.00645325006917119, 0.006774963811039925, 0.007096677087247372, 0.007418390829116106, 0.00774010457098484, 0.008061817847192287, 0.008383532054722309, 0.008705245330929756, 0.009026959538459778, 0.009348672814667225, 0.009670387022197247, 0.009992100298404694, 0.010313814505934715, 0.010635527782142162, 0.010957241989672184, 0.011278955265879631, 0.011600669473409653, 0.0119223827496171, 0.012244096025824547, 0.012565809302031994, 0.012887523509562016, 0.013209236785769463, 0.013530950993299484, 0.013852664269506931, 0.014174377545714378, 0.0144960917532444, 0.014817805960774422, 0.015139519236981869, 0.01546123344451189, 0.015782946720719337, 0.01610466092824936, 0.01642637327313423, 0.016748087480664253, 0.017069801688194275, 0.017391514033079147, 0.01771322824060917, 0.01803494058549404, 0.018356654793024063, 0.018678369000554085, 0.019000083208084106, 0.01932179555296898, 0.019643509760499, 0.019965223968029022]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 5.0, 3.0, 4.0, 10.0, 11.0, 18.0, 12.0, 14.0, 14.0, 28.0, 30.0, 23.0, 39.0, 35.0, 49.0, 33.0, 49.0, 47.0, 49.0, 33.0, 57.0, 35.0, 45.0, 47.0, 30.0, 36.0, 40.0, 36.0, 24.0, 17.0, 24.0, 18.0, 17.0, 17.0, 22.0, 9.0, 4.0, 4.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0013175606727600098, -0.001277254894375801, -0.0012369491159915924, -0.0011966433376073837, -0.001156337559223175, -0.0011160317808389664, -0.0010757260024547577, -0.001035420224070549, -0.0009951144456863403, -0.0009548086673021317, -0.000914502888917923, -0.0008741971105337143, -0.0008338913321495056, -0.0007935855537652969, -0.0007532797753810883, -0.0007129739969968796, -0.0006726682186126709, -0.0006323624402284622, -0.0005920566618442535, -0.0005517508834600449, -0.0005114451050758362, -0.0004711393266916275, -0.0004308335483074188, -0.00039052776992321014, -0.00035022199153900146, -0.0003099162131547928, -0.0002696104347705841, -0.00022930465638637543, -0.00018899887800216675, -0.00014869309961795807, -0.00010838732123374939, -6.808154284954071e-05, -2.777576446533203e-05, 1.2530013918876648e-05, 5.283579230308533e-05, 9.3141570687294e-05, 0.00013344734907150269, 0.00017375312745571136, 0.00021405890583992004, 0.0002543646842241287, 0.0002946704626083374, 0.0003349762409925461, 0.00037528201937675476, 0.00041558779776096344, 0.0004558935761451721, 0.0004961993545293808, 0.0005365051329135895, 0.0005768109112977982, 0.0006171166896820068, 0.0006574224680662155, 0.0006977282464504242, 0.0007380340248346329, 0.0007783398032188416, 0.0008186455816030502, 0.0008589513599872589, 0.0008992571383714676, 0.0009395629167556763, 0.000979868695139885, 0.0010201744735240936, 0.0010604802519083023, 0.001100786030292511, 0.0011410918086767197, 0.0011813975870609283, 0.001221703365445137, 0.0012620091438293457]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 4.0, 4.0, 4.0, 7.0, 9.0, 10.0, 8.0, 18.0, 13.0, 16.0, 15.0, 32.0, 22.0, 25.0, 30.0, 27.0, 33.0, 40.0, 34.0, 32.0, 40.0, 47.0, 48.0, 44.0, 52.0, 37.0, 43.0, 40.0, 30.0, 34.0, 30.0, 20.0, 35.0, 17.0, 22.0, 11.0, 11.0, 16.0, 5.0, 7.0, 8.0, 6.0, 4.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7734375, -8.51605224609375, -8.2586669921875, -8.00128173828125, -7.743896484375, -7.48651123046875, -7.2291259765625, -6.97174072265625, -6.71435546875, -6.45697021484375, -6.1995849609375, -5.94219970703125, -5.684814453125, -5.42742919921875, -5.1700439453125, -4.91265869140625, -4.6552734375, -4.39788818359375, -4.1405029296875, -3.88311767578125, -3.625732421875, -3.36834716796875, -3.1109619140625, -2.85357666015625, -2.59619140625, -2.33880615234375, -2.0814208984375, -1.82403564453125, -1.566650390625, -1.30926513671875, -1.0518798828125, -0.79449462890625, -0.537109375, -0.27972412109375, -0.0223388671875, 0.23504638671875, 0.492431640625, 0.74981689453125, 1.0072021484375, 1.26458740234375, 1.52197265625, 1.77935791015625, 2.0367431640625, 2.29412841796875, 2.551513671875, 2.80889892578125, 3.0662841796875, 3.32366943359375, 3.5810546875, 3.83843994140625, 4.0958251953125, 4.35321044921875, 4.610595703125, 4.86798095703125, 5.1253662109375, 5.38275146484375, 5.64013671875, 5.89752197265625, 6.1549072265625, 6.41229248046875, 6.669677734375, 6.92706298828125, 7.1844482421875, 7.44183349609375, 7.69921875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 5.0, 6.0, 8.0, 8.0, 10.0, 17.0, 18.0, 34.0, 47.0, 38.0, 47.0, 90.0, 107.0, 137.0, 186.0, 274.0, 316.0, 509.0, 799.0, 1602.0, 5044.0, 24400.0, 376740.0, 597630.0, 30049.0, 5858.0, 1780.0, 811.0, 530.0, 356.0, 294.0, 184.0, 134.0, 123.0, 88.0, 70.0, 36.0, 30.0, 38.0, 21.0, 18.0, 11.0, 8.0, 10.0, 9.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.140625, -21.490478515625, -20.84033203125, -20.190185546875, -19.5400390625, -18.889892578125, -18.23974609375, -17.589599609375, -16.939453125, -16.289306640625, -15.63916015625, -14.989013671875, -14.3388671875, -13.688720703125, -13.03857421875, -12.388427734375, -11.73828125, -11.088134765625, -10.43798828125, -9.787841796875, -9.1376953125, -8.487548828125, -7.83740234375, -7.187255859375, -6.537109375, -5.886962890625, -5.23681640625, -4.586669921875, -3.9365234375, -3.286376953125, -2.63623046875, -1.986083984375, -1.3359375, -0.685791015625, -0.03564453125, 0.614501953125, 1.2646484375, 1.914794921875, 2.56494140625, 3.215087890625, 3.865234375, 4.515380859375, 5.16552734375, 5.815673828125, 6.4658203125, 7.115966796875, 7.76611328125, 8.416259765625, 9.06640625, 9.716552734375, 10.36669921875, 11.016845703125, 11.6669921875, 12.317138671875, 12.96728515625, 13.617431640625, 14.267578125, 14.917724609375, 15.56787109375, 16.218017578125, 16.8681640625, 17.518310546875, 18.16845703125, 18.818603515625, 19.46875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 10.0, 8.0, 17.0, 12.0, 10.0, 20.0, 17.0, 22.0, 27.0, 23.0, 18.0, 34.0, 28.0, 44.0, 44.0, 57.0, 69.0, 211.0, 1703.0, 176.0, 80.0, 38.0, 53.0, 43.0, 40.0, 28.0, 26.0, 27.0, 27.0, 21.0, 19.0, 14.0, 10.0, 12.0, 8.0, 10.0, 8.0, 5.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 3.0], "bins": [-23.578125, -22.873779296875, -22.16943359375, -21.465087890625, -20.7607421875, -20.056396484375, -19.35205078125, -18.647705078125, -17.943359375, -17.239013671875, -16.53466796875, -15.830322265625, -15.1259765625, -14.421630859375, -13.71728515625, -13.012939453125, -12.30859375, -11.604248046875, -10.89990234375, -10.195556640625, -9.4912109375, -8.786865234375, -8.08251953125, -7.378173828125, -6.673828125, -5.969482421875, -5.26513671875, -4.560791015625, -3.8564453125, -3.152099609375, -2.44775390625, -1.743408203125, -1.0390625, -0.334716796875, 0.36962890625, 1.073974609375, 1.7783203125, 2.482666015625, 3.18701171875, 3.891357421875, 4.595703125, 5.300048828125, 6.00439453125, 6.708740234375, 7.4130859375, 8.117431640625, 8.82177734375, 9.526123046875, 10.23046875, 10.934814453125, 11.63916015625, 12.343505859375, 13.0478515625, 13.752197265625, 14.45654296875, 15.160888671875, 15.865234375, 16.569580078125, 17.27392578125, 17.978271484375, 18.6826171875, 19.386962890625, 20.09130859375, 20.795654296875, 21.5]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 6.0, 1.0, 3.0, 4.0, 3.0, 2.0, 6.0, 6.0, 12.0, 8.0, 11.0, 20.0, 9.0, 26.0, 22.0, 26.0, 30.0, 29.0, 55.0, 61.0, 90.0, 144.0, 243.0, 574.0, 4014.0, 2921371.0, 215758.0, 1979.0, 459.0, 251.0, 115.0, 69.0, 49.0, 31.0, 31.0, 32.0, 32.0, 25.0, 18.0, 16.0, 18.0, 10.0, 12.0, 10.0, 5.0, 4.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0], "bins": [-60.15625, -58.20849609375, -56.2607421875, -54.31298828125, -52.365234375, -50.41748046875, -48.4697265625, -46.52197265625, -44.57421875, -42.62646484375, -40.6787109375, -38.73095703125, -36.783203125, -34.83544921875, -32.8876953125, -30.93994140625, -28.9921875, -27.04443359375, -25.0966796875, -23.14892578125, -21.201171875, -19.25341796875, -17.3056640625, -15.35791015625, -13.41015625, -11.46240234375, -9.5146484375, -7.56689453125, -5.619140625, -3.67138671875, -1.7236328125, 0.22412109375, 2.171875, 4.11962890625, 6.0673828125, 8.01513671875, 9.962890625, 11.91064453125, 13.8583984375, 15.80615234375, 17.75390625, 19.70166015625, 21.6494140625, 23.59716796875, 25.544921875, 27.49267578125, 29.4404296875, 31.38818359375, 33.3359375, 35.28369140625, 37.2314453125, 39.17919921875, 41.126953125, 43.07470703125, 45.0224609375, 46.97021484375, 48.91796875, 50.86572265625, 52.8134765625, 54.76123046875, 56.708984375, 58.65673828125, 60.6044921875, 62.55224609375, 64.5]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 48.0, 154.0, 381.0, 295.0, 109.0, 24.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-94.01274871826172, -92.23455047607422, -90.45635223388672, -88.67814636230469, -86.89994812011719, -85.12174987792969, -83.34355163574219, -81.56535339355469, -79.78714752197266, -78.00894927978516, -76.23075103759766, -74.45254516601562, -72.67434692382812, -70.89614868164062, -69.11795043945312, -67.33975219726562, -65.56155395507812, -63.783355712890625, -62.00515365600586, -60.22695541381836, -58.448753356933594, -56.670555114746094, -54.892356872558594, -53.11415481567383, -51.33595275878906, -49.55775451660156, -47.7795524597168, -46.0013542175293, -44.22315216064453, -42.44495391845703, -40.66675567626953, -38.888553619384766, -37.110347747802734, -35.332149505615234, -33.55394744873047, -31.77574920654297, -29.997547149658203, -28.219348907470703, -26.44114875793457, -24.662948608398438, -22.884748458862305, -21.106548309326172, -19.32834815979004, -17.550148010253906, -15.77194881439209, -13.993748664855957, -12.21554946899414, -10.437349319458008, -8.659149169921875, -6.880949020385742, -5.102749347686768, -3.324549674987793, -1.5463495254516602, 0.23185062408447266, 2.010049819946289, 3.788249969482422, 5.566450119018555, 7.3446502685546875, 9.12285041809082, 10.901049613952637, 12.67924976348877, 14.457449913024902, 16.23564910888672, 18.01384925842285, 19.792049407958984]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 7.0, 9.0, 7.0, 9.0, 13.0, 13.0, 17.0, 9.0, 11.0, 13.0, 24.0, 31.0, 33.0, 33.0, 28.0, 41.0, 38.0, 37.0, 40.0, 42.0, 36.0, 41.0, 44.0, 36.0, 35.0, 36.0, 28.0, 32.0, 32.0, 27.0, 21.0, 24.0, 17.0, 19.0, 19.0, 13.0, 12.0, 14.0, 13.0, 6.0, 14.0, 5.0, 5.0, 3.0, 1.0, 4.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.40106964111328, -50.55718231201172, -48.71329116821289, -46.86940383911133, -45.0255126953125, -43.18162536621094, -41.337738037109375, -39.49384689331055, -37.649959564208984, -35.80607223510742, -33.962181091308594, -32.11829376220703, -30.274404525756836, -28.43051528930664, -26.586626052856445, -24.74273681640625, -22.898847579956055, -21.05495834350586, -19.211069107055664, -17.36717987060547, -15.523292541503906, -13.679403305053711, -11.835514068603516, -9.991625785827637, -8.147736549377441, -6.303847789764404, -4.459959030151367, -2.616069793701172, -0.7721810340881348, 1.0717077255249023, 2.9155969619750977, 4.759485244750977, 6.603374481201172, 8.447263717651367, 10.291152000427246, 12.135041236877441, 13.97892951965332, 15.822818756103516, 17.66670799255371, 19.510597229003906, 21.35448455810547, 23.198373794555664, 25.04226303100586, 26.886150360107422, 28.730039596557617, 30.573928833007812, 32.417816162109375, 34.2617073059082, 36.10559844970703, 37.949485778808594, 39.79337692260742, 41.637264251708984, 43.48115539550781, 45.325042724609375, 47.16893005371094, 49.012821197509766, 50.85670852661133, 52.70059585571289, 54.54448699951172, 56.38837432861328, 58.23226547241211, 60.07615280151367, 61.9200439453125, 63.76393127441406, 65.60781860351562]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 4.0, 5.0, 3.0, 0.0, 11.0, 9.0, 12.0, 19.0, 25.0, 17.0, 26.0, 26.0, 24.0, 30.0, 28.0, 36.0, 33.0, 49.0, 24.0, 48.0, 41.0, 40.0, 54.0, 53.0, 45.0, 46.0, 48.0, 35.0, 35.0, 20.0, 25.0, 23.0, 17.0, 17.0, 13.0, 10.0, 9.0, 12.0, 5.0, 8.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4609375, -9.182861328125, -8.90478515625, -8.626708984375, -8.3486328125, -8.070556640625, -7.79248046875, -7.514404296875, -7.236328125, -6.958251953125, -6.68017578125, -6.402099609375, -6.1240234375, -5.845947265625, -5.56787109375, -5.289794921875, -5.01171875, -4.733642578125, -4.45556640625, -4.177490234375, -3.8994140625, -3.621337890625, -3.34326171875, -3.065185546875, -2.787109375, -2.509033203125, -2.23095703125, -1.952880859375, -1.6748046875, -1.396728515625, -1.11865234375, -0.840576171875, -0.5625, -0.284423828125, -0.00634765625, 0.271728515625, 0.5498046875, 0.827880859375, 1.10595703125, 1.384033203125, 1.662109375, 1.940185546875, 2.21826171875, 2.496337890625, 2.7744140625, 3.052490234375, 3.33056640625, 3.608642578125, 3.88671875, 4.164794921875, 4.44287109375, 4.720947265625, 4.9990234375, 5.277099609375, 5.55517578125, 5.833251953125, 6.111328125, 6.389404296875, 6.66748046875, 6.945556640625, 7.2236328125, 7.501708984375, 7.77978515625, 8.057861328125, 8.3359375]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 8.0, 7.0, 7.0, 11.0, 13.0, 14.0, 23.0, 28.0, 32.0, 51.0, 61.0, 67.0, 98.0, 138.0, 180.0, 272.0, 481.0, 987.0, 2107.0, 5736.0, 21317.0, 152851.0, 1463574.0, 2175165.0, 321415.0, 35678.0, 8197.0, 2807.0, 1252.0, 633.0, 330.0, 203.0, 124.0, 101.0, 63.0, 59.0, 41.0, 35.0, 30.0, 24.0, 16.0, 14.0, 13.0, 7.0, 8.0, 5.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0], "bins": [-17.5625, -17.0628662109375, -16.563232421875, -16.0635986328125, -15.56396484375, -15.0643310546875, -14.564697265625, -14.0650634765625, -13.5654296875, -13.0657958984375, -12.566162109375, -12.0665283203125, -11.56689453125, -11.0672607421875, -10.567626953125, -10.0679931640625, -9.568359375, -9.0687255859375, -8.569091796875, -8.0694580078125, -7.56982421875, -7.0701904296875, -6.570556640625, -6.0709228515625, -5.5712890625, -5.0716552734375, -4.572021484375, -4.0723876953125, -3.57275390625, -3.0731201171875, -2.573486328125, -2.0738525390625, -1.57421875, -1.0745849609375, -0.574951171875, -0.0753173828125, 0.42431640625, 0.9239501953125, 1.423583984375, 1.9232177734375, 2.4228515625, 2.9224853515625, 3.422119140625, 3.9217529296875, 4.42138671875, 4.9210205078125, 5.420654296875, 5.9202880859375, 6.419921875, 6.9195556640625, 7.419189453125, 7.9188232421875, 8.41845703125, 8.9180908203125, 9.417724609375, 9.9173583984375, 10.4169921875, 10.9166259765625, 11.416259765625, 11.9158935546875, 12.41552734375, 12.9151611328125, 13.414794921875, 13.9144287109375, 14.4140625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 4.0, 7.0, 5.0, 11.0, 14.0, 15.0, 24.0, 41.0, 62.0, 107.0, 169.0, 199.0, 348.0, 493.0, 567.0, 574.0, 453.0, 314.0, 227.0, 148.0, 88.0, 60.0, 48.0, 41.0, 12.0, 15.0, 5.0, 9.0, 5.0, 4.0, 4.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.609375, -9.102294921875, -8.59521484375, -8.088134765625, -7.5810546875, -7.073974609375, -6.56689453125, -6.059814453125, -5.552734375, -5.045654296875, -4.53857421875, -4.031494140625, -3.5244140625, -3.017333984375, -2.51025390625, -2.003173828125, -1.49609375, -0.989013671875, -0.48193359375, 0.025146484375, 0.5322265625, 1.039306640625, 1.54638671875, 2.053466796875, 2.560546875, 3.067626953125, 3.57470703125, 4.081787109375, 4.5888671875, 5.095947265625, 5.60302734375, 6.110107421875, 6.6171875, 7.124267578125, 7.63134765625, 8.138427734375, 8.6455078125, 9.152587890625, 9.65966796875, 10.166748046875, 10.673828125, 11.180908203125, 11.68798828125, 12.195068359375, 12.7021484375, 13.209228515625, 13.71630859375, 14.223388671875, 14.73046875, 15.237548828125, 15.74462890625, 16.251708984375, 16.7587890625, 17.265869140625, 17.77294921875, 18.280029296875, 18.787109375, 19.294189453125, 19.80126953125, 20.308349609375, 20.8154296875, 21.322509765625, 21.82958984375, 22.336669921875, 22.84375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 11.0, 13.0, 7.0, 14.0, 17.0, 28.0, 41.0, 40.0, 61.0, 81.0, 134.0, 186.0, 274.0, 509.0, 1250.0, 5662.0, 82946.0, 3706380.0, 379376.0, 13469.0, 2053.0, 676.0, 366.0, 206.0, 139.0, 102.0, 81.0, 42.0, 36.0, 30.0, 15.0, 17.0, 11.0, 4.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-49.78125, -48.42431640625, -47.0673828125, -45.71044921875, -44.353515625, -42.99658203125, -41.6396484375, -40.28271484375, -38.92578125, -37.56884765625, -36.2119140625, -34.85498046875, -33.498046875, -32.14111328125, -30.7841796875, -29.42724609375, -28.0703125, -26.71337890625, -25.3564453125, -23.99951171875, -22.642578125, -21.28564453125, -19.9287109375, -18.57177734375, -17.21484375, -15.85791015625, -14.5009765625, -13.14404296875, -11.787109375, -10.43017578125, -9.0732421875, -7.71630859375, -6.359375, -5.00244140625, -3.6455078125, -2.28857421875, -0.931640625, 0.42529296875, 1.7822265625, 3.13916015625, 4.49609375, 5.85302734375, 7.2099609375, 8.56689453125, 9.923828125, 11.28076171875, 12.6376953125, 13.99462890625, 15.3515625, 16.70849609375, 18.0654296875, 19.42236328125, 20.779296875, 22.13623046875, 23.4931640625, 24.85009765625, 26.20703125, 27.56396484375, 28.9208984375, 30.27783203125, 31.634765625, 32.99169921875, 34.3486328125, 35.70556640625, 37.0625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 14.0, 62.0, 227.0, 335.0, 264.0, 77.0, 19.0, 12.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-233.24407958984375, -228.71530151367188, -224.18653869628906, -219.6577606201172, -215.12899780273438, -210.6002197265625, -206.0714569091797, -201.5426788330078, -197.013916015625, -192.48513793945312, -187.9563751220703, -183.42759704589844, -178.89883422851562, -174.37005615234375, -169.84129333496094, -165.31251525878906, -160.78375244140625, -156.25497436523438, -151.72621154785156, -147.1974334716797, -142.66867065429688, -138.139892578125, -133.6111297607422, -129.0823516845703, -124.55357360839844, -120.0248031616211, -115.49603271484375, -110.9672622680664, -106.43849182128906, -101.90972137451172, -97.38095092773438, -92.8521728515625, -88.32340240478516, -83.79463195800781, -79.26586151123047, -74.73709106445312, -70.20832061767578, -65.67955017089844, -61.15077590942383, -56.622005462646484, -52.09323501586914, -47.5644645690918, -43.03569412231445, -38.506919860839844, -33.9781494140625, -29.44938087463379, -24.920608520507812, -20.39183807373047, -15.863067626953125, -11.334297180175781, -6.805525779724121, -2.276754379272461, 2.252016067504883, 6.780786514282227, 11.309558868408203, 15.838329315185547, 20.36709976196289, 24.895870208740234, 29.424640655517578, 33.95341491699219, 38.48218536376953, 43.010955810546875, 47.53972625732422, 52.06849670410156, 56.597267150878906]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 4.0, 3.0, 5.0, 5.0, 10.0, 11.0, 10.0, 14.0, 18.0, 27.0, 19.0, 31.0, 28.0, 39.0, 37.0, 40.0, 39.0, 36.0, 48.0, 35.0, 40.0, 41.0, 43.0, 39.0, 37.0, 42.0, 35.0, 30.0, 40.0, 24.0, 24.0, 14.0, 25.0, 22.0, 20.0, 17.0, 11.0, 10.0, 11.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.10435485839844, -42.69416809082031, -41.28398513793945, -39.87379837036133, -38.4636116027832, -37.053428649902344, -35.64324188232422, -34.233055114746094, -32.82286834716797, -31.412683486938477, -30.00249671936035, -28.59231185913086, -27.182125091552734, -25.771940231323242, -24.36175537109375, -22.951568603515625, -21.541385650634766, -20.131200790405273, -18.72101402282715, -17.310829162597656, -15.900643348693848, -14.490457534790039, -13.080272674560547, -11.670086860656738, -10.25990104675293, -8.849715232849121, -7.439529895782471, -6.02934455871582, -4.619158744812012, -3.208972930908203, -1.798788070678711, -0.38860225677490234, 1.0215835571289062, 2.4317691326141357, 3.8419547080993652, 5.252140045166016, 6.662325859069824, 8.072511672973633, 9.482696533203125, 10.892882347106934, 12.303068161010742, 13.71325397491455, 15.12343978881836, 16.53362464904785, 17.943809509277344, 19.35399627685547, 20.76418113708496, 22.174365997314453, 23.584552764892578, 24.99473762512207, 26.404924392700195, 27.815109252929688, 29.225296020507812, 30.635480880737305, 32.0456657409668, 33.45585250854492, 34.86603546142578, 36.276222229003906, 37.686405181884766, 39.09659194946289, 40.506778717041016, 41.916961669921875, 43.3271484375, 44.737335205078125, 46.14752197265625]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 4.0, 2.0, 9.0, 9.0, 11.0, 15.0, 4.0, 13.0, 21.0, 15.0, 26.0, 22.0, 18.0, 21.0, 28.0, 24.0, 29.0, 34.0, 29.0, 42.0, 33.0, 47.0, 41.0, 35.0, 51.0, 49.0, 38.0, 42.0, 25.0, 27.0, 34.0, 19.0, 23.0, 23.0, 16.0, 21.0, 15.0, 10.0, 22.0, 6.0, 8.0, 6.0, 9.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-8.609375, -8.35888671875, -8.1083984375, -7.85791015625, -7.607421875, -7.35693359375, -7.1064453125, -6.85595703125, -6.60546875, -6.35498046875, -6.1044921875, -5.85400390625, -5.603515625, -5.35302734375, -5.1025390625, -4.85205078125, -4.6015625, -4.35107421875, -4.1005859375, -3.85009765625, -3.599609375, -3.34912109375, -3.0986328125, -2.84814453125, -2.59765625, -2.34716796875, -2.0966796875, -1.84619140625, -1.595703125, -1.34521484375, -1.0947265625, -0.84423828125, -0.59375, -0.34326171875, -0.0927734375, 0.15771484375, 0.408203125, 0.65869140625, 0.9091796875, 1.15966796875, 1.41015625, 1.66064453125, 1.9111328125, 2.16162109375, 2.412109375, 2.66259765625, 2.9130859375, 3.16357421875, 3.4140625, 3.66455078125, 3.9150390625, 4.16552734375, 4.416015625, 4.66650390625, 4.9169921875, 5.16748046875, 5.41796875, 5.66845703125, 5.9189453125, 6.16943359375, 6.419921875, 6.67041015625, 6.9208984375, 7.17138671875, 7.421875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 6.0, 5.0, 7.0, 15.0, 22.0, 36.0, 63.0, 107.0, 153.0, 235.0, 368.0, 599.0, 1001.0, 1727.0, 2870.0, 5027.0, 8548.0, 14675.0, 25204.0, 44065.0, 78592.0, 136400.0, 207394.0, 207261.0, 134331.0, 76983.0, 43119.0, 24867.0, 14409.0, 8428.0, 4832.0, 2911.0, 1646.0, 1034.0, 592.0, 391.0, 247.0, 136.0, 111.0, 50.0, 30.0, 22.0, 15.0, 11.0, 7.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.923828125, -0.8958206176757812, -0.8678131103515625, -0.8398056030273438, -0.811798095703125, -0.7837905883789062, -0.7557830810546875, -0.7277755737304688, -0.69976806640625, -0.6717605590820312, -0.6437530517578125, -0.6157455444335938, -0.587738037109375, -0.5597305297851562, -0.5317230224609375, -0.5037155151367188, -0.4757080078125, -0.44770050048828125, -0.4196929931640625, -0.39168548583984375, -0.363677978515625, -0.33567047119140625, -0.3076629638671875, -0.27965545654296875, -0.25164794921875, -0.22364044189453125, -0.1956329345703125, -0.16762542724609375, -0.139617919921875, -0.11161041259765625, -0.0836029052734375, -0.05559539794921875, -0.027587890625, 0.00041961669921875, 0.0284271240234375, 0.05643463134765625, 0.084442138671875, 0.11244964599609375, 0.1404571533203125, 0.16846466064453125, 0.19647216796875, 0.22447967529296875, 0.2524871826171875, 0.28049468994140625, 0.308502197265625, 0.33650970458984375, 0.3645172119140625, 0.39252471923828125, 0.4205322265625, 0.44853973388671875, 0.4765472412109375, 0.5045547485351562, 0.532562255859375, 0.5605697631835938, 0.5885772705078125, 0.6165847778320312, 0.64459228515625, 0.6725997924804688, 0.7006072998046875, 0.7286148071289062, 0.756622314453125, 0.7846298217773438, 0.8126373291015625, 0.8406448364257812, 0.86865234375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 1.0, 5.0, 5.0, 14.0, 14.0, 14.0, 16.0, 15.0, 35.0, 31.0, 33.0, 39.0, 43.0, 48.0, 43.0, 46.0, 39.0, 1075.0, 41.0, 58.0, 50.0, 41.0, 41.0, 42.0, 26.0, 32.0, 37.0, 28.0, 24.0, 22.0, 17.0, 13.0, 9.0, 10.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.82421875, -6.6234130859375, -6.422607421875, -6.2218017578125, -6.02099609375, -5.8201904296875, -5.619384765625, -5.4185791015625, -5.2177734375, -5.0169677734375, -4.816162109375, -4.6153564453125, -4.41455078125, -4.2137451171875, -4.012939453125, -3.8121337890625, -3.611328125, -3.4105224609375, -3.209716796875, -3.0089111328125, -2.80810546875, -2.6072998046875, -2.406494140625, -2.2056884765625, -2.0048828125, -1.8040771484375, -1.603271484375, -1.4024658203125, -1.20166015625, -1.0008544921875, -0.800048828125, -0.5992431640625, -0.3984375, -0.1976318359375, 0.003173828125, 0.2039794921875, 0.40478515625, 0.6055908203125, 0.806396484375, 1.0072021484375, 1.2080078125, 1.4088134765625, 1.609619140625, 1.8104248046875, 2.01123046875, 2.2120361328125, 2.412841796875, 2.6136474609375, 2.814453125, 3.0152587890625, 3.216064453125, 3.4168701171875, 3.61767578125, 3.8184814453125, 4.019287109375, 4.2200927734375, 4.4208984375, 4.6217041015625, 4.822509765625, 5.0233154296875, 5.22412109375, 5.4249267578125, 5.625732421875, 5.8265380859375, 6.02734375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 9.0, 2.0, 10.0, 9.0, 15.0, 29.0, 32.0, 54.0, 84.0, 117.0, 165.0, 281.0, 444.0, 771.0, 1069.0, 1818.0, 2934.0, 4722.0, 7696.0, 12709.0, 21936.0, 38805.0, 68242.0, 119697.0, 187688.0, 1260616.0, 153635.0, 90427.0, 51260.0, 29156.0, 16899.0, 9862.0, 6087.0, 3553.0, 2283.0, 1372.0, 965.0, 609.0, 394.0, 252.0, 149.0, 99.0, 64.0, 39.0, 31.0, 17.0, 18.0, 9.0, 1.0, 2.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0], "bins": [-0.830078125, -0.80511474609375, -0.7801513671875, -0.75518798828125, -0.730224609375, -0.70526123046875, -0.6802978515625, -0.65533447265625, -0.63037109375, -0.60540771484375, -0.5804443359375, -0.55548095703125, -0.530517578125, -0.50555419921875, -0.4805908203125, -0.45562744140625, -0.4306640625, -0.40570068359375, -0.3807373046875, -0.35577392578125, -0.330810546875, -0.30584716796875, -0.2808837890625, -0.25592041015625, -0.23095703125, -0.20599365234375, -0.1810302734375, -0.15606689453125, -0.131103515625, -0.10614013671875, -0.0811767578125, -0.05621337890625, -0.03125, -0.00628662109375, 0.0186767578125, 0.04364013671875, 0.068603515625, 0.09356689453125, 0.1185302734375, 0.14349365234375, 0.16845703125, 0.19342041015625, 0.2183837890625, 0.24334716796875, 0.268310546875, 0.29327392578125, 0.3182373046875, 0.34320068359375, 0.3681640625, 0.39312744140625, 0.4180908203125, 0.44305419921875, 0.468017578125, 0.49298095703125, 0.5179443359375, 0.54290771484375, 0.56787109375, 0.59283447265625, 0.6177978515625, 0.64276123046875, 0.667724609375, 0.69268798828125, 0.7176513671875, 0.74261474609375, 0.767578125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 4.0, 4.0, 3.0, 6.0, 5.0, 4.0, 3.0, 4.0, 10.0, 9.0, 13.0, 9.0, 16.0, 17.0, 16.0, 13.0, 30.0, 20.0, 31.0, 29.0, 28.0, 35.0, 33.0, 38.0, 32.0, 47.0, 38.0, 35.0, 32.0, 29.0, 46.0, 40.0, 31.0, 25.0, 30.0, 33.0, 20.0, 24.0, 23.0, 21.0, 20.0, 18.0, 16.0, 10.0, 15.0, 11.0, 6.0, 4.0, 5.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0], "bins": [-0.0018472671508789062, -0.001788705587387085, -0.0017301440238952637, -0.0016715824604034424, -0.001613020896911621, -0.0015544593334197998, -0.0014958977699279785, -0.0014373362064361572, -0.001378774642944336, -0.0013202130794525146, -0.0012616515159606934, -0.001203089952468872, -0.0011445283889770508, -0.0010859668254852295, -0.0010274052619934082, -0.0009688436985015869, -0.0009102821350097656, -0.0008517205715179443, -0.000793159008026123, -0.0007345974445343018, -0.0006760358810424805, -0.0006174743175506592, -0.0005589127540588379, -0.0005003511905670166, -0.0004417896270751953, -0.000383228063583374, -0.00032466650009155273, -0.00026610493659973145, -0.00020754337310791016, -0.00014898180961608887, -9.042024612426758e-05, -3.185868263244629e-05, 2.6702880859375e-05, 8.526444435119629e-05, 0.00014382600784301758, 0.00020238757133483887, 0.00026094913482666016, 0.00031951069831848145, 0.00037807226181030273, 0.000436633825302124, 0.0004951953887939453, 0.0005537569522857666, 0.0006123185157775879, 0.0006708800792694092, 0.0007294416427612305, 0.0007880032062530518, 0.000846564769744873, 0.0009051263332366943, 0.0009636878967285156, 0.001022249460220337, 0.0010808110237121582, 0.0011393725872039795, 0.0011979341506958008, 0.001256495714187622, 0.0013150572776794434, 0.0013736188411712646, 0.001432180404663086, 0.0014907419681549072, 0.0015493035316467285, 0.0016078650951385498, 0.001666426658630371, 0.0017249882221221924, 0.0017835497856140137, 0.001842111349105835, 0.0019006729125976562]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 4.0, 9.0, 7.0, 11.0, 9.0, 7.0, 19.0, 17.0, 35.0, 23.0, 31.0, 32.0, 48.0, 55.0, 47.0, 80.0, 108.0, 130.0, 188.0, 253.0, 436.0, 704.0, 5212.0, 886158.0, 151476.0, 1503.0, 575.0, 359.0, 200.0, 180.0, 117.0, 112.0, 73.0, 38.0, 45.0, 35.0, 36.0, 24.0, 29.0, 21.0, 14.0, 19.0, 10.0, 15.0, 9.0, 7.0, 11.0, 4.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 4.0], "bins": [-0.037445068359375, -0.03626728057861328, -0.03508949279785156, -0.033911705017089844, -0.032733917236328125, -0.031556129455566406, -0.030378341674804688, -0.02920055389404297, -0.02802276611328125, -0.02684497833251953, -0.025667190551757812, -0.024489402770996094, -0.023311614990234375, -0.022133827209472656, -0.020956039428710938, -0.01977825164794922, -0.0186004638671875, -0.01742267608642578, -0.016244888305664062, -0.015067100524902344, -0.013889312744140625, -0.012711524963378906, -0.011533737182617188, -0.010355949401855469, -0.00917816162109375, -0.008000373840332031, -0.0068225860595703125, -0.005644798278808594, -0.004467010498046875, -0.0032892227172851562, -0.0021114349365234375, -0.0009336471557617188, 0.000244140625, 0.0014219284057617188, 0.0025997161865234375, 0.0037775039672851562, 0.004955291748046875, 0.006133079528808594, 0.0073108673095703125, 0.008488655090332031, 0.00966644287109375, 0.010844230651855469, 0.012022018432617188, 0.013199806213378906, 0.014377593994140625, 0.015555381774902344, 0.016733169555664062, 0.01791095733642578, 0.0190887451171875, 0.02026653289794922, 0.021444320678710938, 0.022622108459472656, 0.023799896240234375, 0.024977684020996094, 0.026155471801757812, 0.02733325958251953, 0.02851104736328125, 0.02968883514404297, 0.030866622924804688, 0.032044410705566406, 0.033222198486328125, 0.034399986267089844, 0.03557777404785156, 0.03675556182861328, 0.037933349609375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [8.0, 10.0, 35.0, 137.0, 264.0, 340.0, 164.0, 45.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007205752190202475, -0.0005811104201711714, -0.0004416456213220954, -0.00030218082247301936, -0.00016271602362394333, -2.3251224774867296e-05, 0.00011621357407420874, 0.00025567837292328477, 0.0003951431717723608, 0.0005346079706214368, 0.0006740727694705129, 0.0008135375683195889, 0.0009530023671686649, 0.0010924672242254019, 0.001231931964866817, 0.0013713967055082321, 0.001510861562564969, 0.001650326419621706, 0.0017897911602631211, 0.0019292559009045362, 0.002068720757961273, 0.00220818561501801, 0.002347650472074747, 0.0024871150963008404, 0.0026265799533575773, 0.0027660448104143143, 0.0029055094346404076, 0.0030449742916971445, 0.0031844391487538815, 0.0033239040058106184, 0.0034633688628673553, 0.0036028334870934486, 0.003742298111319542, 0.003881762968376279, 0.004021227825433016, 0.004160692449659109, 0.00430015753954649, 0.004439622163772583, 0.004579086787998676, 0.004718551877886057, 0.00485801650211215, 0.0049974811263382435, 0.005136946216225624, 0.005276410840451717, 0.005415875464677811, 0.005555340554565191, 0.0056948051787912846, 0.005834270268678665, 0.0059737348929047585, 0.006113199517130852, 0.006252664607018232, 0.006392129231244326, 0.006531594321131706, 0.0066710589453577995, 0.006810523569583893, 0.006949988659471273, 0.007089453283697367, 0.00722891790792346, 0.007368382997810841, 0.007507847622036934, 0.007647312246263027, 0.007786777336150408, 0.007926242426037788, 0.008065707050263882, 0.008205171674489975]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 4.0, 2.0, 3.0, 3.0, 5.0, 3.0, 13.0, 9.0, 17.0, 6.0, 14.0, 16.0, 25.0, 24.0, 35.0, 36.0, 40.0, 29.0, 34.0, 50.0, 47.0, 42.0, 37.0, 48.0, 51.0, 53.0, 35.0, 44.0, 32.0, 29.0, 29.0, 25.0, 15.0, 28.0, 20.0, 15.0, 19.0, 14.0, 10.0, 15.0, 9.0, 3.0, 10.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0016497969627380371, -0.0016045374795794487, -0.0015592779964208603, -0.0015140185132622719, -0.0014687590301036835, -0.001423499546945095, -0.0013782400637865067, -0.0013329805806279182, -0.0012877210974693298, -0.0012424616143107414, -0.001197202131152153, -0.0011519426479935646, -0.0011066831648349762, -0.0010614236816763878, -0.0010161641985177994, -0.000970904715359211, -0.0009256452322006226, -0.0008803857490420341, -0.0008351262658834457, -0.0007898667827248573, -0.0007446072995662689, -0.0006993478164076805, -0.0006540883332490921, -0.0006088288500905037, -0.0005635693669319153, -0.0005183098837733269, -0.00047305040061473846, -0.00042779091745615005, -0.00038253143429756165, -0.00033727195113897324, -0.0002920124679803848, -0.0002467529848217964, -0.000201493501663208, -0.0001562340185046196, -0.00011097453534603119, -6.571505218744278e-05, -2.045556902885437e-05, 2.480391412973404e-05, 7.006339728832245e-05, 0.00011532288044691086, 0.00016058236360549927, 0.00020584184676408768, 0.0002511013299226761, 0.0002963608130812645, 0.0003416202962398529, 0.0003868797793984413, 0.0004321392625570297, 0.00047739874571561813, 0.0005226582288742065, 0.000567917712032795, 0.0006131771951913834, 0.0006584366783499718, 0.0007036961615085602, 0.0007489556446671486, 0.000794215127825737, 0.0008394746109843254, 0.0008847340941429138, 0.0009299935773015022, 0.0009752530604600906, 0.001020512543618679, 0.0010657720267772675, 0.0011110315099358559, 0.0011562909930944443, 0.0012015504762530327, 0.001246809959411621]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 2.0, 4.0, 2.0, 9.0, 9.0, 11.0, 15.0, 4.0, 13.0, 21.0, 15.0, 26.0, 22.0, 18.0, 21.0, 28.0, 24.0, 29.0, 34.0, 29.0, 42.0, 33.0, 47.0, 41.0, 35.0, 51.0, 49.0, 38.0, 42.0, 25.0, 27.0, 34.0, 19.0, 23.0, 23.0, 16.0, 21.0, 15.0, 10.0, 22.0, 6.0, 8.0, 6.0, 9.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-8.609375, -8.35888671875, -8.1083984375, -7.85791015625, -7.607421875, -7.35693359375, -7.1064453125, -6.85595703125, -6.60546875, -6.35498046875, -6.1044921875, -5.85400390625, -5.603515625, -5.35302734375, -5.1025390625, -4.85205078125, -4.6015625, -4.35107421875, -4.1005859375, -3.85009765625, -3.599609375, -3.34912109375, -3.0986328125, -2.84814453125, -2.59765625, -2.34716796875, -2.0966796875, -1.84619140625, -1.595703125, -1.34521484375, -1.0947265625, -0.84423828125, -0.59375, -0.34326171875, -0.0927734375, 0.15771484375, 0.408203125, 0.65869140625, 0.9091796875, 1.15966796875, 1.41015625, 1.66064453125, 1.9111328125, 2.16162109375, 2.412109375, 2.66259765625, 2.9130859375, 3.16357421875, 3.4140625, 3.66455078125, 3.9150390625, 4.16552734375, 4.416015625, 4.66650390625, 4.9169921875, 5.16748046875, 5.41796875, 5.66845703125, 5.9189453125, 6.16943359375, 6.419921875, 6.67041015625, 6.9208984375, 7.17138671875, 7.421875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 6.0, 9.0, 9.0, 8.0, 9.0, 15.0, 24.0, 20.0, 29.0, 42.0, 34.0, 58.0, 73.0, 81.0, 129.0, 176.0, 275.0, 377.0, 597.0, 1119.0, 2108.0, 4118.0, 8671.0, 20558.0, 54314.0, 162937.0, 460956.0, 216099.0, 68506.0, 25793.0, 10719.0, 4767.0, 2462.0, 1262.0, 718.0, 453.0, 247.0, 183.0, 140.0, 102.0, 85.0, 58.0, 57.0, 41.0, 25.0, 25.0, 13.0, 16.0, 11.0, 8.0, 7.0, 5.0, 2.0, 2.0, 0.0, 3.0], "bins": [-11.1171875, -10.7960205078125, -10.474853515625, -10.1536865234375, -9.83251953125, -9.5113525390625, -9.190185546875, -8.8690185546875, -8.5478515625, -8.2266845703125, -7.905517578125, -7.5843505859375, -7.26318359375, -6.9420166015625, -6.620849609375, -6.2996826171875, -5.978515625, -5.6573486328125, -5.336181640625, -5.0150146484375, -4.69384765625, -4.3726806640625, -4.051513671875, -3.7303466796875, -3.4091796875, -3.0880126953125, -2.766845703125, -2.4456787109375, -2.12451171875, -1.8033447265625, -1.482177734375, -1.1610107421875, -0.83984375, -0.5186767578125, -0.197509765625, 0.1236572265625, 0.44482421875, 0.7659912109375, 1.087158203125, 1.4083251953125, 1.7294921875, 2.0506591796875, 2.371826171875, 2.6929931640625, 3.01416015625, 3.3353271484375, 3.656494140625, 3.9776611328125, 4.298828125, 4.6199951171875, 4.941162109375, 5.2623291015625, 5.58349609375, 5.9046630859375, 6.225830078125, 6.5469970703125, 6.8681640625, 7.1893310546875, 7.510498046875, 7.8316650390625, 8.15283203125, 8.4739990234375, 8.795166015625, 9.1163330078125, 9.4375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 3.0, 5.0, 12.0, 11.0, 12.0, 11.0, 17.0, 21.0, 32.0, 35.0, 33.0, 32.0, 45.0, 46.0, 83.0, 91.0, 121.0, 1594.0, 303.0, 126.0, 77.0, 55.0, 59.0, 44.0, 42.0, 24.0, 24.0, 28.0, 15.0, 8.0, 6.0, 8.0, 8.0, 9.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-34.3125, -33.405029296875, -32.49755859375, -31.590087890625, -30.6826171875, -29.775146484375, -28.86767578125, -27.960205078125, -27.052734375, -26.145263671875, -25.23779296875, -24.330322265625, -23.4228515625, -22.515380859375, -21.60791015625, -20.700439453125, -19.79296875, -18.885498046875, -17.97802734375, -17.070556640625, -16.1630859375, -15.255615234375, -14.34814453125, -13.440673828125, -12.533203125, -11.625732421875, -10.71826171875, -9.810791015625, -8.9033203125, -7.995849609375, -7.08837890625, -6.180908203125, -5.2734375, -4.365966796875, -3.45849609375, -2.551025390625, -1.6435546875, -0.736083984375, 0.17138671875, 1.078857421875, 1.986328125, 2.893798828125, 3.80126953125, 4.708740234375, 5.6162109375, 6.523681640625, 7.43115234375, 8.338623046875, 9.24609375, 10.153564453125, 11.06103515625, 11.968505859375, 12.8759765625, 13.783447265625, 14.69091796875, 15.598388671875, 16.505859375, 17.413330078125, 18.32080078125, 19.228271484375, 20.1357421875, 21.043212890625, 21.95068359375, 22.858154296875, 23.765625]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 5.0, 5.0, 9.0, 21.0, 20.0, 23.0, 33.0, 41.0, 65.0, 87.0, 134.0, 189.0, 321.0, 631.0, 2751.0, 45532.0, 2919502.0, 168450.0, 5804.0, 865.0, 398.0, 233.0, 156.0, 119.0, 83.0, 49.0, 53.0, 33.0, 24.0, 19.0, 15.0, 7.0, 4.0, 7.0, 8.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.34375, -40.0380859375, -38.732421875, -37.4267578125, -36.12109375, -34.8154296875, -33.509765625, -32.2041015625, -30.8984375, -29.5927734375, -28.287109375, -26.9814453125, -25.67578125, -24.3701171875, -23.064453125, -21.7587890625, -20.453125, -19.1474609375, -17.841796875, -16.5361328125, -15.23046875, -13.9248046875, -12.619140625, -11.3134765625, -10.0078125, -8.7021484375, -7.396484375, -6.0908203125, -4.78515625, -3.4794921875, -2.173828125, -0.8681640625, 0.4375, 1.7431640625, 3.048828125, 4.3544921875, 5.66015625, 6.9658203125, 8.271484375, 9.5771484375, 10.8828125, 12.1884765625, 13.494140625, 14.7998046875, 16.10546875, 17.4111328125, 18.716796875, 20.0224609375, 21.328125, 22.6337890625, 23.939453125, 25.2451171875, 26.55078125, 27.8564453125, 29.162109375, 30.4677734375, 31.7734375, 33.0791015625, 34.384765625, 35.6904296875, 36.99609375, 38.3017578125, 39.607421875, 40.9130859375, 42.21875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 63.0, 330.0, 492.0, 122.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-208.62489318847656, -204.62548828125, -200.62606811523438, -196.6266632080078, -192.6272430419922, -188.62783813476562, -184.62841796875, -180.62901306152344, -176.62960815429688, -172.6302032470703, -168.6307830810547, -164.63137817382812, -160.6319580078125, -156.63255310058594, -152.6331329345703, -148.63372802734375, -144.63430786132812, -140.63490295410156, -136.63548278808594, -132.63607788085938, -128.63665771484375, -124.63725280761719, -120.6378402709961, -116.638427734375, -112.6390151977539, -108.63960266113281, -104.64019012451172, -100.64077758789062, -96.64137268066406, -92.64195251464844, -88.64254760742188, -84.64313507080078, -80.64372253417969, -76.6443099975586, -72.6448974609375, -68.6454849243164, -64.64607238769531, -60.646663665771484, -56.647254943847656, -52.64784240722656, -48.648433685302734, -44.64902114868164, -40.64961242675781, -36.65019989013672, -32.650787353515625, -28.65137481689453, -24.65196418762207, -20.65255355834961, -16.653141021728516, -12.653729438781738, -8.654317855834961, -4.654906272888184, -0.6554946899414062, 3.3439178466796875, 7.343328475952148, 11.34273910522461, 15.342151641845703, 19.341564178466797, 23.340974807739258, 27.34038543701172, 31.339797973632812, 35.339210510253906, 39.338623046875, 43.33803176879883, 47.33744430541992]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 6.0, 7.0, 5.0, 3.0, 7.0, 10.0, 12.0, 8.0, 18.0, 21.0, 15.0, 24.0, 32.0, 27.0, 28.0, 38.0, 40.0, 36.0, 47.0, 39.0, 39.0, 47.0, 38.0, 38.0, 38.0, 39.0, 52.0, 39.0, 34.0, 23.0, 30.0, 24.0, 24.0, 24.0, 20.0, 17.0, 13.0, 9.0, 5.0, 6.0, 5.0, 4.0, 1.0, 3.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-50.9552001953125, -49.37029266357422, -47.78538513183594, -46.200477600097656, -44.615570068359375, -43.030662536621094, -41.44575500488281, -39.86084747314453, -38.27593994140625, -36.69103240966797, -35.10612487792969, -33.521217346191406, -31.936309814453125, -30.351402282714844, -28.766494750976562, -27.18158721923828, -25.596677780151367, -24.011770248413086, -22.426862716674805, -20.841955184936523, -19.257047653198242, -17.67214012145996, -16.087230682373047, -14.502324104309082, -12.9174165725708, -11.33250904083252, -9.747601509094238, -8.16269302368164, -6.577785968780518, -4.992878437042236, -3.407970428466797, -1.8230628967285156, -0.23815536499023438, 1.3467522859573364, 2.9316599369049072, 4.516567707061768, 6.101475238800049, 7.68638277053833, 9.27129077911377, 10.85619831085205, 12.441105842590332, 14.026013374328613, 15.610920906066895, 17.195829391479492, 18.780736923217773, 20.365644454956055, 21.950551986694336, 23.535459518432617, 25.1203670501709, 26.70527458190918, 28.29018211364746, 29.875089645385742, 31.459997177124023, 33.04490661621094, 34.62981414794922, 36.2147216796875, 37.79962921142578, 39.38453674316406, 40.969444274902344, 42.554351806640625, 44.139259338378906, 45.72416687011719, 47.30907440185547, 48.89398193359375, 50.47888946533203]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 4.0, 5.0, 6.0, 9.0, 4.0, 15.0, 10.0, 13.0, 16.0, 18.0, 26.0, 19.0, 20.0, 29.0, 23.0, 23.0, 32.0, 47.0, 42.0, 32.0, 36.0, 42.0, 55.0, 45.0, 48.0, 48.0, 29.0, 36.0, 30.0, 38.0, 25.0, 31.0, 14.0, 13.0, 24.0, 18.0, 18.0, 14.0, 7.0, 3.0, 6.0, 5.0, 5.0, 5.0, 5.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-9.53125, -9.25823974609375, -8.9852294921875, -8.71221923828125, -8.439208984375, -8.16619873046875, -7.8931884765625, -7.62017822265625, -7.34716796875, -7.07415771484375, -6.8011474609375, -6.52813720703125, -6.255126953125, -5.98211669921875, -5.7091064453125, -5.43609619140625, -5.1630859375, -4.89007568359375, -4.6170654296875, -4.34405517578125, -4.071044921875, -3.79803466796875, -3.5250244140625, -3.25201416015625, -2.97900390625, -2.70599365234375, -2.4329833984375, -2.15997314453125, -1.886962890625, -1.61395263671875, -1.3409423828125, -1.06793212890625, -0.794921875, -0.52191162109375, -0.2489013671875, 0.02410888671875, 0.297119140625, 0.57012939453125, 0.8431396484375, 1.11614990234375, 1.38916015625, 1.66217041015625, 1.9351806640625, 2.20819091796875, 2.481201171875, 2.75421142578125, 3.0272216796875, 3.30023193359375, 3.5732421875, 3.84625244140625, 4.1192626953125, 4.39227294921875, 4.665283203125, 4.93829345703125, 5.2113037109375, 5.48431396484375, 5.75732421875, 6.03033447265625, 6.3033447265625, 6.57635498046875, 6.849365234375, 7.12237548828125, 7.3953857421875, 7.66839599609375, 7.94140625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 6.0, 8.0, 5.0, 12.0, 7.0, 10.0, 12.0, 18.0, 10.0, 18.0, 24.0, 30.0, 34.0, 52.0, 103.0, 159.0, 365.0, 941.0, 3075.0, 15829.0, 245994.0, 2670152.0, 1186044.0, 61198.0, 6988.0, 1871.0, 643.0, 273.0, 103.0, 68.0, 55.0, 28.0, 25.0, 28.0, 8.0, 18.0, 13.0, 10.0, 6.0, 7.0, 9.0, 6.0, 5.0, 3.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-22.078125, -21.443115234375, -20.80810546875, -20.173095703125, -19.5380859375, -18.903076171875, -18.26806640625, -17.633056640625, -16.998046875, -16.363037109375, -15.72802734375, -15.093017578125, -14.4580078125, -13.822998046875, -13.18798828125, -12.552978515625, -11.91796875, -11.282958984375, -10.64794921875, -10.012939453125, -9.3779296875, -8.742919921875, -8.10791015625, -7.472900390625, -6.837890625, -6.202880859375, -5.56787109375, -4.932861328125, -4.2978515625, -3.662841796875, -3.02783203125, -2.392822265625, -1.7578125, -1.122802734375, -0.48779296875, 0.147216796875, 0.7822265625, 1.417236328125, 2.05224609375, 2.687255859375, 3.322265625, 3.957275390625, 4.59228515625, 5.227294921875, 5.8623046875, 6.497314453125, 7.13232421875, 7.767333984375, 8.40234375, 9.037353515625, 9.67236328125, 10.307373046875, 10.9423828125, 11.577392578125, 12.21240234375, 12.847412109375, 13.482421875, 14.117431640625, 14.75244140625, 15.387451171875, 16.0224609375, 16.657470703125, 17.29248046875, 17.927490234375, 18.5625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 6.0, 8.0, 7.0, 15.0, 5.0, 20.0, 19.0, 28.0, 32.0, 50.0, 62.0, 83.0, 129.0, 192.0, 228.0, 353.0, 439.0, 472.0, 466.0, 396.0, 286.0, 235.0, 162.0, 90.0, 85.0, 50.0, 38.0, 26.0, 26.0, 16.0, 9.0, 13.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.5859375, -11.22216796875, -10.8583984375, -10.49462890625, -10.130859375, -9.76708984375, -9.4033203125, -9.03955078125, -8.67578125, -8.31201171875, -7.9482421875, -7.58447265625, -7.220703125, -6.85693359375, -6.4931640625, -6.12939453125, -5.765625, -5.40185546875, -5.0380859375, -4.67431640625, -4.310546875, -3.94677734375, -3.5830078125, -3.21923828125, -2.85546875, -2.49169921875, -2.1279296875, -1.76416015625, -1.400390625, -1.03662109375, -0.6728515625, -0.30908203125, 0.0546875, 0.41845703125, 0.7822265625, 1.14599609375, 1.509765625, 1.87353515625, 2.2373046875, 2.60107421875, 2.96484375, 3.32861328125, 3.6923828125, 4.05615234375, 4.419921875, 4.78369140625, 5.1474609375, 5.51123046875, 5.875, 6.23876953125, 6.6025390625, 6.96630859375, 7.330078125, 7.69384765625, 8.0576171875, 8.42138671875, 8.78515625, 9.14892578125, 9.5126953125, 9.87646484375, 10.240234375, 10.60400390625, 10.9677734375, 11.33154296875, 11.6953125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 5.0, 7.0, 9.0, 12.0, 17.0, 16.0, 21.0, 23.0, 33.0, 55.0, 88.0, 161.0, 250.0, 509.0, 1341.0, 4453.0, 20304.0, 136025.0, 2324146.0, 1586187.0, 98873.0, 15719.0, 3627.0, 1195.0, 489.0, 222.0, 137.0, 94.0, 65.0, 50.0, 40.0, 20.0, 15.0, 16.0, 18.0, 4.0, 12.0, 10.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-23.765625, -23.065185546875, -22.36474609375, -21.664306640625, -20.9638671875, -20.263427734375, -19.56298828125, -18.862548828125, -18.162109375, -17.461669921875, -16.76123046875, -16.060791015625, -15.3603515625, -14.659912109375, -13.95947265625, -13.259033203125, -12.55859375, -11.858154296875, -11.15771484375, -10.457275390625, -9.7568359375, -9.056396484375, -8.35595703125, -7.655517578125, -6.955078125, -6.254638671875, -5.55419921875, -4.853759765625, -4.1533203125, -3.452880859375, -2.75244140625, -2.052001953125, -1.3515625, -0.651123046875, 0.04931640625, 0.749755859375, 1.4501953125, 2.150634765625, 2.85107421875, 3.551513671875, 4.251953125, 4.952392578125, 5.65283203125, 6.353271484375, 7.0537109375, 7.754150390625, 8.45458984375, 9.155029296875, 9.85546875, 10.555908203125, 11.25634765625, 11.956787109375, 12.6572265625, 13.357666015625, 14.05810546875, 14.758544921875, 15.458984375, 16.159423828125, 16.85986328125, 17.560302734375, 18.2607421875, 18.961181640625, 19.66162109375, 20.362060546875, 21.0625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 8.0, 28.0, 150.0, 315.0, 304.0, 143.0, 52.0, 11.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-199.92689514160156, -196.01365661621094, -192.10040283203125, -188.18716430664062, -184.27392578125, -180.36068725585938, -176.4474334716797, -172.53419494628906, -168.62095642089844, -164.7077178955078, -160.79446411132812, -156.8812255859375, -152.96798706054688, -149.05474853515625, -145.14149475097656, -141.22825622558594, -137.31500244140625, -133.40176391601562, -129.48851013183594, -125.57527160644531, -121.66203308105469, -117.74878692626953, -113.83554077148438, -109.92230224609375, -106.00906372070312, -102.09581756591797, -98.18257904052734, -94.26933288574219, -90.35609436035156, -86.4428482055664, -82.52960205078125, -78.61636352539062, -74.703125, -70.78987884521484, -66.87664031982422, -62.96339416503906, -59.05015563964844, -55.13690948486328, -51.22366714477539, -47.3104248046875, -43.397178649902344, -39.48393630981445, -35.57069396972656, -31.65744972229004, -27.74420738220215, -23.830965042114258, -19.917720794677734, -16.004478454589844, -12.091236114501953, -8.177993774414062, -4.2647504806518555, -0.35150718688964844, 3.561735153198242, 7.474977493286133, 11.388221740722656, 15.301464080810547, 19.214706420898438, 23.127948760986328, 27.04119110107422, 30.954435348510742, 34.86767578125, 38.780921936035156, 42.69416427612305, 46.60740661621094, 50.52064895629883]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 0.0, 5.0, 5.0, 8.0, 11.0, 10.0, 16.0, 13.0, 16.0, 23.0, 12.0, 22.0, 24.0, 20.0, 46.0, 39.0, 46.0, 38.0, 44.0, 33.0, 40.0, 35.0, 36.0, 43.0, 49.0, 30.0, 37.0, 32.0, 33.0, 35.0, 28.0, 19.0, 32.0, 24.0, 17.0, 14.0, 11.0, 15.0, 10.0, 6.0, 7.0, 3.0, 9.0, 1.0, 3.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-40.77088928222656, -39.532928466796875, -38.29496765136719, -37.0570068359375, -35.81904602050781, -34.58108139038086, -33.34312057495117, -32.105159759521484, -30.867198944091797, -29.62923812866211, -28.391277313232422, -27.1533145904541, -25.915353775024414, -24.677392959594727, -23.439430236816406, -22.20146942138672, -20.96350860595703, -19.725547790527344, -18.487586975097656, -17.249624252319336, -16.01166343688965, -14.773702621459961, -13.535740852355957, -12.297779083251953, -11.059818267822266, -9.821857452392578, -8.583895683288574, -7.3459343910217285, -6.107973098754883, -4.870011806488037, -3.6320505142211914, -2.3940887451171875, -1.1561279296875, 0.0818333625793457, 1.3197946548461914, 2.557755947113037, 3.795717239379883, 5.0336785316467285, 6.271639823913574, 7.509601593017578, 8.747562408447266, 9.985523223876953, 11.223484992980957, 12.461446762084961, 13.699407577514648, 14.937368392944336, 16.175331115722656, 17.413291931152344, 18.65125274658203, 19.88921356201172, 21.127174377441406, 22.365137100219727, 23.603097915649414, 24.8410587310791, 26.079021453857422, 27.31698226928711, 28.554943084716797, 29.792903900146484, 31.030864715576172, 32.26882553100586, 33.50679016113281, 34.7447509765625, 35.98271179199219, 37.220672607421875, 38.45863342285156]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 0.0, 2.0, 2.0, 6.0, 2.0, 6.0, 7.0, 6.0, 9.0, 4.0, 12.0, 11.0, 16.0, 16.0, 22.0, 18.0, 24.0, 22.0, 33.0, 29.0, 29.0, 32.0, 41.0, 44.0, 39.0, 40.0, 45.0, 46.0, 43.0, 38.0, 43.0, 38.0, 26.0, 36.0, 32.0, 19.0, 28.0, 23.0, 14.0, 18.0, 14.0, 15.0, 8.0, 12.0, 2.0, 8.0, 11.0, 4.0, 5.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-9.0234375, -8.7607421875, -8.498046875, -8.2353515625, -7.97265625, -7.7099609375, -7.447265625, -7.1845703125, -6.921875, -6.6591796875, -6.396484375, -6.1337890625, -5.87109375, -5.6083984375, -5.345703125, -5.0830078125, -4.8203125, -4.5576171875, -4.294921875, -4.0322265625, -3.76953125, -3.5068359375, -3.244140625, -2.9814453125, -2.71875, -2.4560546875, -2.193359375, -1.9306640625, -1.66796875, -1.4052734375, -1.142578125, -0.8798828125, -0.6171875, -0.3544921875, -0.091796875, 0.1708984375, 0.43359375, 0.6962890625, 0.958984375, 1.2216796875, 1.484375, 1.7470703125, 2.009765625, 2.2724609375, 2.53515625, 2.7978515625, 3.060546875, 3.3232421875, 3.5859375, 3.8486328125, 4.111328125, 4.3740234375, 4.63671875, 4.8994140625, 5.162109375, 5.4248046875, 5.6875, 5.9501953125, 6.212890625, 6.4755859375, 6.73828125, 7.0009765625, 7.263671875, 7.5263671875, 7.7890625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 9.0, 10.0, 24.0, 40.0, 58.0, 75.0, 129.0, 172.0, 282.0, 380.0, 570.0, 895.0, 1360.0, 2074.0, 3204.0, 4965.0, 7589.0, 12093.0, 18621.0, 28754.0, 44817.0, 69618.0, 105725.0, 149930.0, 172249.0, 142865.0, 99338.0, 65410.0, 41859.0, 26502.0, 17182.0, 11178.0, 7167.0, 4654.0, 3029.0, 2012.0, 1249.0, 819.0, 563.0, 327.0, 259.0, 168.0, 119.0, 72.0, 40.0, 38.0, 20.0, 16.0, 10.0, 9.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.6748046875, -0.6533279418945312, -0.6318511962890625, -0.6103744506835938, -0.588897705078125, -0.5674209594726562, -0.5459442138671875, -0.5244674682617188, -0.50299072265625, -0.48151397705078125, -0.4600372314453125, -0.43856048583984375, -0.417083740234375, -0.39560699462890625, -0.3741302490234375, -0.35265350341796875, -0.3311767578125, -0.30970001220703125, -0.2882232666015625, -0.26674652099609375, -0.245269775390625, -0.22379302978515625, -0.2023162841796875, -0.18083953857421875, -0.15936279296875, -0.13788604736328125, -0.1164093017578125, -0.09493255615234375, -0.073455810546875, -0.05197906494140625, -0.0305023193359375, -0.00902557373046875, 0.012451171875, 0.03392791748046875, 0.0554046630859375, 0.07688140869140625, 0.098358154296875, 0.11983489990234375, 0.1413116455078125, 0.16278839111328125, 0.18426513671875, 0.20574188232421875, 0.2272186279296875, 0.24869537353515625, 0.270172119140625, 0.29164886474609375, 0.3131256103515625, 0.33460235595703125, 0.3560791015625, 0.37755584716796875, 0.3990325927734375, 0.42050933837890625, 0.441986083984375, 0.46346282958984375, 0.4849395751953125, 0.5064163208007812, 0.52789306640625, 0.5493698120117188, 0.5708465576171875, 0.5923233032226562, 0.613800048828125, 0.6352767944335938, 0.6567535400390625, 0.6782302856445312, 0.69970703125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 9.0, 14.0, 12.0, 7.0, 16.0, 12.0, 25.0, 35.0, 32.0, 29.0, 34.0, 34.0, 40.0, 47.0, 54.0, 38.0, 46.0, 1060.0, 65.0, 38.0, 43.0, 27.0, 37.0, 37.0, 33.0, 31.0, 26.0, 22.0, 23.0, 14.0, 24.0, 12.0, 8.0, 9.0, 8.0, 8.0, 2.0, 2.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.91015625, -6.71954345703125, -6.5289306640625, -6.33831787109375, -6.147705078125, -5.95709228515625, -5.7664794921875, -5.57586669921875, -5.38525390625, -5.19464111328125, -5.0040283203125, -4.81341552734375, -4.622802734375, -4.43218994140625, -4.2415771484375, -4.05096435546875, -3.8603515625, -3.66973876953125, -3.4791259765625, -3.28851318359375, -3.097900390625, -2.90728759765625, -2.7166748046875, -2.52606201171875, -2.33544921875, -2.14483642578125, -1.9542236328125, -1.76361083984375, -1.572998046875, -1.38238525390625, -1.1917724609375, -1.00115966796875, -0.810546875, -0.61993408203125, -0.4293212890625, -0.23870849609375, -0.048095703125, 0.14251708984375, 0.3331298828125, 0.52374267578125, 0.71435546875, 0.90496826171875, 1.0955810546875, 1.28619384765625, 1.476806640625, 1.66741943359375, 1.8580322265625, 2.04864501953125, 2.2392578125, 2.42987060546875, 2.6204833984375, 2.81109619140625, 3.001708984375, 3.19232177734375, 3.3829345703125, 3.57354736328125, 3.76416015625, 3.95477294921875, 4.1453857421875, 4.33599853515625, 4.526611328125, 4.71722412109375, 4.9078369140625, 5.09844970703125, 5.2890625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 18.0, 20.0, 37.0, 40.0, 62.0, 99.0, 146.0, 247.0, 369.0, 523.0, 928.0, 1323.0, 2043.0, 3190.0, 5004.0, 8044.0, 12915.0, 21528.0, 36304.0, 60561.0, 101698.0, 157464.0, 1244217.0, 165880.0, 109228.0, 66040.0, 38706.0, 22787.0, 14034.0, 8606.0, 5392.0, 3428.0, 2273.0, 1380.0, 896.0, 600.0, 366.0, 253.0, 168.0, 101.0, 66.0, 44.0, 25.0, 13.0, 19.0, 15.0, 7.0, 7.0, 5.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7119140625, -0.688629150390625, -0.66534423828125, -0.642059326171875, -0.6187744140625, -0.595489501953125, -0.57220458984375, -0.548919677734375, -0.525634765625, -0.502349853515625, -0.47906494140625, -0.455780029296875, -0.4324951171875, -0.409210205078125, -0.38592529296875, -0.362640380859375, -0.33935546875, -0.316070556640625, -0.29278564453125, -0.269500732421875, -0.2462158203125, -0.222930908203125, -0.19964599609375, -0.176361083984375, -0.153076171875, -0.129791259765625, -0.10650634765625, -0.083221435546875, -0.0599365234375, -0.036651611328125, -0.01336669921875, 0.009918212890625, 0.033203125, 0.056488037109375, 0.07977294921875, 0.103057861328125, 0.1263427734375, 0.149627685546875, 0.17291259765625, 0.196197509765625, 0.219482421875, 0.242767333984375, 0.26605224609375, 0.289337158203125, 0.3126220703125, 0.335906982421875, 0.35919189453125, 0.382476806640625, 0.40576171875, 0.429046630859375, 0.45233154296875, 0.475616455078125, 0.4989013671875, 0.522186279296875, 0.54547119140625, 0.568756103515625, 0.592041015625, 0.615325927734375, 0.63861083984375, 0.661895751953125, 0.6851806640625, 0.708465576171875, 0.73175048828125, 0.755035400390625, 0.7783203125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 9.0, 8.0, 10.0, 11.0, 13.0, 26.0, 23.0, 21.0, 28.0, 39.0, 38.0, 30.0, 45.0, 60.0, 29.0, 48.0, 40.0, 63.0, 56.0, 44.0, 51.0, 50.0, 36.0, 26.0, 32.0, 29.0, 19.0, 17.0, 23.0, 14.0, 5.0, 11.0, 6.0, 9.0, 3.0, 3.0, 3.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0018863677978515625, -0.001826852560043335, -0.0017673373222351074, -0.0017078220844268799, -0.0016483068466186523, -0.0015887916088104248, -0.0015292763710021973, -0.0014697611331939697, -0.0014102458953857422, -0.0013507306575775146, -0.0012912154197692871, -0.0012317001819610596, -0.001172184944152832, -0.0011126697063446045, -0.001053154468536377, -0.0009936392307281494, -0.0009341239929199219, -0.0008746087551116943, -0.0008150935173034668, -0.0007555782794952393, -0.0006960630416870117, -0.0006365478038787842, -0.0005770325660705566, -0.0005175173282623291, -0.00045800209045410156, -0.000398486852645874, -0.0003389716148376465, -0.00027945637702941895, -0.0002199411392211914, -0.00016042590141296387, -0.00010091066360473633, -4.139542579650879e-05, 1.811981201171875e-05, 7.763504981994629e-05, 0.00013715028762817383, 0.00019666552543640137, 0.0002561807632446289, 0.00031569600105285645, 0.000375211238861084, 0.0004347264766693115, 0.0004942417144775391, 0.0005537569522857666, 0.0006132721900939941, 0.0006727874279022217, 0.0007323026657104492, 0.0007918179035186768, 0.0008513331413269043, 0.0009108483791351318, 0.0009703636169433594, 0.001029878854751587, 0.0010893940925598145, 0.001148909330368042, 0.0012084245681762695, 0.001267939805984497, 0.0013274550437927246, 0.0013869702816009521, 0.0014464855194091797, 0.0015060007572174072, 0.0015655159950256348, 0.0016250312328338623, 0.0016845464706420898, 0.0017440617084503174, 0.001803576946258545, 0.0018630921840667725, 0.001922607421875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 8.0, 7.0, 8.0, 14.0, 6.0, 13.0, 13.0, 25.0, 29.0, 27.0, 42.0, 39.0, 51.0, 76.0, 98.0, 123.0, 196.0, 288.0, 468.0, 899.0, 26892.0, 1008290.0, 8709.0, 834.0, 424.0, 243.0, 146.0, 131.0, 93.0, 81.0, 59.0, 56.0, 34.0, 19.0, 26.0, 23.0, 7.0, 10.0, 12.0, 7.0, 3.0, 5.0, 9.0, 1.0, 3.0, 1.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.03607177734375, -0.034923553466796875, -0.03377532958984375, -0.032627105712890625, -0.0314788818359375, -0.030330657958984375, -0.02918243408203125, -0.028034210205078125, -0.026885986328125, -0.025737762451171875, -0.02458953857421875, -0.023441314697265625, -0.0222930908203125, -0.021144866943359375, -0.01999664306640625, -0.018848419189453125, -0.0177001953125, -0.016551971435546875, -0.01540374755859375, -0.014255523681640625, -0.0131072998046875, -0.011959075927734375, -0.01081085205078125, -0.009662628173828125, -0.008514404296875, -0.007366180419921875, -0.00621795654296875, -0.005069732666015625, -0.0039215087890625, -0.002773284912109375, -0.00162506103515625, -0.000476837158203125, 0.00067138671875, 0.001819610595703125, 0.00296783447265625, 0.004116058349609375, 0.0052642822265625, 0.006412506103515625, 0.00756072998046875, 0.008708953857421875, 0.009857177734375, 0.011005401611328125, 0.01215362548828125, 0.013301849365234375, 0.0144500732421875, 0.015598297119140625, 0.01674652099609375, 0.017894744873046875, 0.01904296875, 0.020191192626953125, 0.02133941650390625, 0.022487640380859375, 0.0236358642578125, 0.024784088134765625, 0.02593231201171875, 0.027080535888671875, 0.028228759765625, 0.029376983642578125, 0.03052520751953125, 0.031673431396484375, 0.0328216552734375, 0.033969879150390625, 0.03511810302734375, 0.036266326904296875, 0.03741455078125]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 52.0, 272.0, 504.0, 162.0, 18.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002896495396271348, -0.002707128180190921, -0.0025177609641104937, -0.0023283937480300665, -0.0021390265319496393, -0.0019496593158692122, -0.0017602919833734632, -0.001570924767293036, -0.0013815575512126088, -0.0011921903351321816, -0.0010028231190517545, -0.0008134558447636664, -0.0006240886286832392, -0.00043472141260281205, -0.00024535413831472397, -5.59869222342968e-05, 0.00013338029384613037, 0.00032274750992655754, 0.0005121147260069847, 0.0007014820002950728, 0.0008908492163755, 0.0010802163742482662, 0.0012695837067440152, 0.0014589509228244424, 0.0016483181389048696, 0.0018376853549852967, 0.0020270526874810457, 0.002216419903561473, 0.0024057871196419, 0.0025951543357223272, 0.0027845215518027544, 0.0029738887678831816, 0.0031632562167942524, 0.0033526234328746796, 0.0035419906489551067, 0.003731357865035534, 0.003920725081115961, 0.004110092297196388, 0.004299459513276815, 0.004488826729357243, 0.00467819394543767, 0.004867561161518097, 0.005056928377598524, 0.005246295593678951, 0.005435662809759378, 0.005625030025839806, 0.005814397241920233, 0.00600376445800066, 0.006193132139742374, 0.006382499355822802, 0.006571866571903229, 0.006761233787983656, 0.006950601004064083, 0.00713996822014451, 0.0073293354362249374, 0.007518702652305365, 0.007708069868385792, 0.007897437550127506, 0.008086804300546646, 0.00827617198228836, 0.0084655387327075, 0.008654906414449215, 0.008844273164868355, 0.00903364084661007, 0.00922300759702921]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 3.0, 5.0, 5.0, 7.0, 11.0, 7.0, 6.0, 10.0, 9.0, 15.0, 26.0, 29.0, 24.0, 30.0, 28.0, 27.0, 36.0, 23.0, 44.0, 33.0, 38.0, 35.0, 44.0, 47.0, 36.0, 37.0, 47.0, 30.0, 33.0, 22.0, 27.0, 29.0, 31.0, 21.0, 19.0, 16.0, 17.0, 17.0, 13.0, 13.0, 12.0, 8.0, 9.0, 3.0, 2.0, 4.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.000975191593170166, -0.0009447075426578522, -0.0009142234921455383, -0.0008837394416332245, -0.0008532553911209106, -0.0008227713406085968, -0.000792287290096283, -0.0007618032395839691, -0.0007313191890716553, -0.0007008351385593414, -0.0006703510880470276, -0.0006398670375347137, -0.0006093829870223999, -0.0005788989365100861, -0.0005484148859977722, -0.0005179308354854584, -0.00048744678497314453, -0.0004569627344608307, -0.00042647868394851685, -0.000395994633436203, -0.00036551058292388916, -0.0003350265324115753, -0.0003045424818992615, -0.00027405843138694763, -0.0002435743808746338, -0.00021309033036231995, -0.0001826062798500061, -0.00015212222933769226, -0.00012163817882537842, -9.115412831306458e-05, -6.067007780075073e-05, -3.018602728843689e-05, 2.980232238769531e-07, 3.0782073736190796e-05, 6.126612424850464e-05, 9.175017476081848e-05, 0.00012223422527313232, 0.00015271827578544617, 0.00018320232629776, 0.00021368637681007385, 0.0002441704273223877, 0.00027465447783470154, 0.0003051385283470154, 0.0003356225788593292, 0.00036610662937164307, 0.0003965906798839569, 0.00042707473039627075, 0.0004575587809085846, 0.00048804283142089844, 0.0005185268819332123, 0.0005490109324455261, 0.00057949498295784, 0.0006099790334701538, 0.0006404630839824677, 0.0006709471344947815, 0.0007014311850070953, 0.0007319152355194092, 0.000762399286031723, 0.0007928833365440369, 0.0008233673870563507, 0.0008538514375686646, 0.0008843354880809784, 0.0009148195385932922, 0.0009453035891056061, 0.0009757876396179199]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 0.0, 2.0, 2.0, 6.0, 2.0, 6.0, 7.0, 6.0, 9.0, 4.0, 12.0, 11.0, 16.0, 16.0, 22.0, 18.0, 24.0, 22.0, 33.0, 29.0, 29.0, 32.0, 41.0, 44.0, 39.0, 40.0, 45.0, 46.0, 43.0, 38.0, 43.0, 37.0, 27.0, 36.0, 32.0, 19.0, 28.0, 23.0, 14.0, 18.0, 14.0, 15.0, 8.0, 12.0, 2.0, 8.0, 11.0, 4.0, 5.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-9.0234375, -8.7607421875, -8.498046875, -8.2353515625, -7.97265625, -7.7099609375, -7.447265625, -7.1845703125, -6.921875, -6.6591796875, -6.396484375, -6.1337890625, -5.87109375, -5.6083984375, -5.345703125, -5.0830078125, -4.8203125, -4.5576171875, -4.294921875, -4.0322265625, -3.76953125, -3.5068359375, -3.244140625, -2.9814453125, -2.71875, -2.4560546875, -2.193359375, -1.9306640625, -1.66796875, -1.4052734375, -1.142578125, -0.8798828125, -0.6171875, -0.3544921875, -0.091796875, 0.1708984375, 0.43359375, 0.6962890625, 0.958984375, 1.2216796875, 1.484375, 1.7470703125, 2.009765625, 2.2724609375, 2.53515625, 2.7978515625, 3.060546875, 3.3232421875, 3.5859375, 3.8486328125, 4.111328125, 4.3740234375, 4.63671875, 4.8994140625, 5.162109375, 5.4248046875, 5.6875, 5.9501953125, 6.212890625, 6.4755859375, 6.73828125, 7.0009765625, 7.263671875, 7.5263671875, 7.7890625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 8.0, 8.0, 11.0, 20.0, 17.0, 27.0, 31.0, 45.0, 65.0, 87.0, 116.0, 145.0, 213.0, 307.0, 513.0, 828.0, 1509.0, 3077.0, 6934.0, 17198.0, 48620.0, 162031.0, 461960.0, 237154.0, 67400.0, 22910.0, 8862.0, 3819.0, 1839.0, 959.0, 603.0, 351.0, 238.0, 159.0, 137.0, 94.0, 67.0, 50.0, 36.0, 24.0, 23.0, 24.0, 11.0, 3.0, 5.0, 9.0, 4.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-11.7578125, -11.4083251953125, -11.058837890625, -10.7093505859375, -10.35986328125, -10.0103759765625, -9.660888671875, -9.3114013671875, -8.9619140625, -8.6124267578125, -8.262939453125, -7.9134521484375, -7.56396484375, -7.2144775390625, -6.864990234375, -6.5155029296875, -6.166015625, -5.8165283203125, -5.467041015625, -5.1175537109375, -4.76806640625, -4.4185791015625, -4.069091796875, -3.7196044921875, -3.3701171875, -3.0206298828125, -2.671142578125, -2.3216552734375, -1.97216796875, -1.6226806640625, -1.273193359375, -0.9237060546875, -0.57421875, -0.2247314453125, 0.124755859375, 0.4742431640625, 0.82373046875, 1.1732177734375, 1.522705078125, 1.8721923828125, 2.2216796875, 2.5711669921875, 2.920654296875, 3.2701416015625, 3.61962890625, 3.9691162109375, 4.318603515625, 4.6680908203125, 5.017578125, 5.3670654296875, 5.716552734375, 6.0660400390625, 6.41552734375, 6.7650146484375, 7.114501953125, 7.4639892578125, 7.8134765625, 8.1629638671875, 8.512451171875, 8.8619384765625, 9.21142578125, 9.5609130859375, 9.910400390625, 10.2598876953125, 10.609375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 7.0, 2.0, 5.0, 1.0, 7.0, 10.0, 9.0, 11.0, 10.0, 14.0, 13.0, 26.0, 27.0, 25.0, 36.0, 35.0, 41.0, 42.0, 58.0, 64.0, 100.0, 195.0, 1403.0, 299.0, 133.0, 82.0, 51.0, 50.0, 38.0, 32.0, 31.0, 22.0, 34.0, 22.0, 19.0, 17.0, 18.0, 14.0, 7.0, 13.0, 6.0, 4.0, 9.0, 2.0, 1.0, 6.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.671875, -17.013671875, -16.35546875, -15.697265625, -15.0390625, -14.380859375, -13.72265625, -13.064453125, -12.40625, -11.748046875, -11.08984375, -10.431640625, -9.7734375, -9.115234375, -8.45703125, -7.798828125, -7.140625, -6.482421875, -5.82421875, -5.166015625, -4.5078125, -3.849609375, -3.19140625, -2.533203125, -1.875, -1.216796875, -0.55859375, 0.099609375, 0.7578125, 1.416015625, 2.07421875, 2.732421875, 3.390625, 4.048828125, 4.70703125, 5.365234375, 6.0234375, 6.681640625, 7.33984375, 7.998046875, 8.65625, 9.314453125, 9.97265625, 10.630859375, 11.2890625, 11.947265625, 12.60546875, 13.263671875, 13.921875, 14.580078125, 15.23828125, 15.896484375, 16.5546875, 17.212890625, 17.87109375, 18.529296875, 19.1875, 19.845703125, 20.50390625, 21.162109375, 21.8203125, 22.478515625, 23.13671875, 23.794921875, 24.453125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 8.0, 3.0, 5.0, 8.0, 10.0, 9.0, 10.0, 8.0, 20.0, 22.0, 32.0, 32.0, 57.0, 81.0, 111.0, 120.0, 179.0, 296.0, 530.0, 1285.0, 12017.0, 780704.0, 2327550.0, 19185.0, 1672.0, 565.0, 361.0, 224.0, 140.0, 107.0, 80.0, 64.0, 54.0, 38.0, 30.0, 22.0, 13.0, 9.0, 9.0, 16.0, 10.0, 5.0, 5.0, 2.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-41.3125, -40.134765625, -38.95703125, -37.779296875, -36.6015625, -35.423828125, -34.24609375, -33.068359375, -31.890625, -30.712890625, -29.53515625, -28.357421875, -27.1796875, -26.001953125, -24.82421875, -23.646484375, -22.46875, -21.291015625, -20.11328125, -18.935546875, -17.7578125, -16.580078125, -15.40234375, -14.224609375, -13.046875, -11.869140625, -10.69140625, -9.513671875, -8.3359375, -7.158203125, -5.98046875, -4.802734375, -3.625, -2.447265625, -1.26953125, -0.091796875, 1.0859375, 2.263671875, 3.44140625, 4.619140625, 5.796875, 6.974609375, 8.15234375, 9.330078125, 10.5078125, 11.685546875, 12.86328125, 14.041015625, 15.21875, 16.396484375, 17.57421875, 18.751953125, 19.9296875, 21.107421875, 22.28515625, 23.462890625, 24.640625, 25.818359375, 26.99609375, 28.173828125, 29.3515625, 30.529296875, 31.70703125, 32.884765625, 34.0625]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 622.0, 389.0, 2.0], "bins": [-767.1044311523438, -754.7151489257812, -742.3258666992188, -729.9365844726562, -717.5473022460938, -705.1580200195312, -692.7687377929688, -680.3794555664062, -667.9901733398438, -655.6008911132812, -643.2116088867188, -630.8223266601562, -618.4330444335938, -606.0437622070312, -593.6544799804688, -581.2651977539062, -568.8759765625, -556.4866943359375, -544.097412109375, -531.7081298828125, -519.31884765625, -506.9295654296875, -494.540283203125, -482.1510009765625, -469.76171875, -457.3724365234375, -444.983154296875, -432.5938720703125, -420.20458984375, -407.8153076171875, -395.426025390625, -383.0367431640625, -370.6474609375, -358.2581787109375, -345.868896484375, -333.4796142578125, -321.09033203125, -308.7010498046875, -296.311767578125, -283.9224853515625, -271.5332336425781, -259.1439514160156, -246.75466918945312, -234.36538696289062, -221.97610473632812, -209.58682250976562, -197.1975555419922, -184.8082733154297, -172.41897583007812, -160.02969360351562, -147.64041137695312, -135.25112915039062, -122.86185455322266, -110.47257232666016, -98.08329772949219, -85.69401550292969, -73.30474090576172, -60.91545867919922, -48.526180267333984, -36.13690185546875, -23.74761962890625, -11.35833740234375, 1.0309371948242188, 13.420219421386719, 25.80950355529785]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 5.0, 1.0, 4.0, 7.0, 3.0, 1.0, 3.0, 4.0, 12.0, 6.0, 15.0, 12.0, 11.0, 18.0, 17.0, 23.0, 21.0, 30.0, 27.0, 24.0, 43.0, 41.0, 34.0, 41.0, 47.0, 37.0, 39.0, 24.0, 34.0, 38.0, 41.0, 33.0, 43.0, 38.0, 32.0, 18.0, 19.0, 22.0, 28.0, 22.0, 13.0, 18.0, 18.0, 9.0, 3.0, 7.0, 5.0, 6.0, 2.0, 5.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.839996337890625, -39.34733581542969, -37.85467529296875, -36.36201095581055, -34.86935043334961, -33.37668991088867, -31.884029388427734, -30.391366958618164, -28.898704528808594, -27.406044006347656, -25.913381576538086, -24.42072105407715, -22.928058624267578, -21.43539810180664, -19.942737579345703, -18.450075149536133, -16.957414627075195, -15.464753150939941, -13.972091674804688, -12.47943115234375, -10.98676872253418, -9.494108200073242, -8.001446723937988, -6.508785247802734, -5.0161237716674805, -3.5234622955322266, -2.0308010578155518, -0.538139820098877, 0.954521656036377, 2.447183132171631, 3.9398441314697266, 5.4325056076049805, 6.925167083740234, 8.417828559875488, 9.910490036010742, 11.40315055847168, 12.89581298828125, 14.388473510742188, 15.881134986877441, 17.373796463012695, 18.866458892822266, 20.359119415283203, 21.851781845092773, 23.34444236755371, 24.83710479736328, 26.32976531982422, 27.822425842285156, 29.315088272094727, 30.807748794555664, 32.300411224365234, 33.79307174682617, 35.28573226928711, 36.77839279174805, 38.27105712890625, 39.76371765136719, 41.256378173828125, 42.74903869628906, 44.24169921875, 45.73435974121094, 47.22702407836914, 48.71968460083008, 50.212345123291016, 51.70500564575195, 53.197669982910156, 54.690330505371094]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 3.0, 10.0, 6.0, 19.0, 11.0, 17.0, 18.0, 19.0, 21.0, 24.0, 22.0, 26.0, 36.0, 42.0, 40.0, 45.0, 32.0, 50.0, 43.0, 51.0, 41.0, 42.0, 45.0, 44.0, 42.0, 30.0, 26.0, 37.0, 30.0, 20.0, 15.0, 12.0, 10.0, 18.0, 8.0, 5.0, 6.0, 8.0, 6.0, 1.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-10.4453125, -10.15234375, -9.859375, -9.56640625, -9.2734375, -8.98046875, -8.6875, -8.39453125, -8.1015625, -7.80859375, -7.515625, -7.22265625, -6.9296875, -6.63671875, -6.34375, -6.05078125, -5.7578125, -5.46484375, -5.171875, -4.87890625, -4.5859375, -4.29296875, -4.0, -3.70703125, -3.4140625, -3.12109375, -2.828125, -2.53515625, -2.2421875, -1.94921875, -1.65625, -1.36328125, -1.0703125, -0.77734375, -0.484375, -0.19140625, 0.1015625, 0.39453125, 0.6875, 0.98046875, 1.2734375, 1.56640625, 1.859375, 2.15234375, 2.4453125, 2.73828125, 3.03125, 3.32421875, 3.6171875, 3.91015625, 4.203125, 4.49609375, 4.7890625, 5.08203125, 5.375, 5.66796875, 5.9609375, 6.25390625, 6.546875, 6.83984375, 7.1328125, 7.42578125, 7.71875, 8.01171875, 8.3046875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 7.0, 7.0, 6.0, 10.0, 9.0, 14.0, 11.0, 12.0, 23.0, 30.0, 31.0, 40.0, 46.0, 63.0, 94.0, 146.0, 166.0, 207.0, 296.0, 398.0, 628.0, 186758.0, 4002731.0, 810.0, 440.0, 314.0, 247.0, 175.0, 134.0, 104.0, 82.0, 55.0, 33.0, 33.0, 25.0, 27.0, 14.0, 12.0, 7.0, 10.0, 9.0, 7.0, 4.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-191.625, -186.166015625, -180.70703125, -175.248046875, -169.7890625, -164.330078125, -158.87109375, -153.412109375, -147.953125, -142.494140625, -137.03515625, -131.576171875, -126.1171875, -120.658203125, -115.19921875, -109.740234375, -104.28125, -98.822265625, -93.36328125, -87.904296875, -82.4453125, -76.986328125, -71.52734375, -66.068359375, -60.609375, -55.150390625, -49.69140625, -44.232421875, -38.7734375, -33.314453125, -27.85546875, -22.396484375, -16.9375, -11.478515625, -6.01953125, -0.560546875, 4.8984375, 10.357421875, 15.81640625, 21.275390625, 26.734375, 32.193359375, 37.65234375, 43.111328125, 48.5703125, 54.029296875, 59.48828125, 64.947265625, 70.40625, 75.865234375, 81.32421875, 86.783203125, 92.2421875, 97.701171875, 103.16015625, 108.619140625, 114.078125, 119.537109375, 124.99609375, 130.455078125, 135.9140625, 141.373046875, 146.83203125, 152.291015625, 157.75]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 12.0, 11.0, 12.0, 10.0, 21.0, 21.0, 33.0, 32.0, 47.0, 53.0, 63.0, 76.0, 138.0, 196.0, 285.0, 414.0, 520.0, 572.0, 483.0, 330.0, 211.0, 162.0, 93.0, 70.0, 52.0, 34.0, 18.0, 32.0, 16.0, 11.0, 10.0, 5.0, 8.0, 4.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2109375, -11.8184814453125, -11.426025390625, -11.0335693359375, -10.64111328125, -10.2486572265625, -9.856201171875, -9.4637451171875, -9.0712890625, -8.6788330078125, -8.286376953125, -7.8939208984375, -7.50146484375, -7.1090087890625, -6.716552734375, -6.3240966796875, -5.931640625, -5.5391845703125, -5.146728515625, -4.7542724609375, -4.36181640625, -3.9693603515625, -3.576904296875, -3.1844482421875, -2.7919921875, -2.3995361328125, -2.007080078125, -1.6146240234375, -1.22216796875, -0.8297119140625, -0.437255859375, -0.0447998046875, 0.34765625, 0.7401123046875, 1.132568359375, 1.5250244140625, 1.91748046875, 2.3099365234375, 2.702392578125, 3.0948486328125, 3.4873046875, 3.8797607421875, 4.272216796875, 4.6646728515625, 5.05712890625, 5.4495849609375, 5.842041015625, 6.2344970703125, 6.626953125, 7.0194091796875, 7.411865234375, 7.8043212890625, 8.19677734375, 8.5892333984375, 8.981689453125, 9.3741455078125, 9.7666015625, 10.1590576171875, 10.551513671875, 10.9439697265625, 11.33642578125, 11.7288818359375, 12.121337890625, 12.5137939453125, 12.90625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 5.0, 4.0, 11.0, 9.0, 18.0, 14.0, 14.0, 21.0, 32.0, 23.0, 34.0, 34.0, 50.0, 66.0, 107.0, 232.0, 1375.0, 614992.0, 3573904.0, 2555.0, 298.0, 111.0, 58.0, 49.0, 50.0, 25.0, 33.0, 28.0, 29.0, 22.0, 17.0, 11.0, 6.0, 9.0, 4.0, 5.0, 5.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-87.375, -84.564453125, -81.75390625, -78.943359375, -76.1328125, -73.322265625, -70.51171875, -67.701171875, -64.890625, -62.080078125, -59.26953125, -56.458984375, -53.6484375, -50.837890625, -48.02734375, -45.216796875, -42.40625, -39.595703125, -36.78515625, -33.974609375, -31.1640625, -28.353515625, -25.54296875, -22.732421875, -19.921875, -17.111328125, -14.30078125, -11.490234375, -8.6796875, -5.869140625, -3.05859375, -0.248046875, 2.5625, 5.373046875, 8.18359375, 10.994140625, 13.8046875, 16.615234375, 19.42578125, 22.236328125, 25.046875, 27.857421875, 30.66796875, 33.478515625, 36.2890625, 39.099609375, 41.91015625, 44.720703125, 47.53125, 50.341796875, 53.15234375, 55.962890625, 58.7734375, 61.583984375, 64.39453125, 67.205078125, 70.015625, 72.826171875, 75.63671875, 78.447265625, 81.2578125, 84.068359375, 86.87890625, 89.689453125, 92.5]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 15.0, 212.0, 597.0, 180.0, 12.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-352.480224609375, -345.3531188964844, -338.22601318359375, -331.098876953125, -323.9717712402344, -316.84466552734375, -309.7175598144531, -302.5904541015625, -295.46331787109375, -288.3362121582031, -281.2091064453125, -274.08197021484375, -266.9548645019531, -259.8277587890625, -252.70065307617188, -245.5735321044922, -238.44644165039062, -231.3193359375, -224.1922149658203, -217.0651092529297, -209.93798828125, -202.81088256835938, -195.68377685546875, -188.55665588378906, -181.42953491210938, -174.30242919921875, -167.17530822753906, -160.04820251464844, -152.92108154296875, -145.79397583007812, -138.6668701171875, -131.5397491455078, -124.41263580322266, -117.2855224609375, -110.15840911865234, -103.03129577636719, -95.90419006347656, -88.7770767211914, -81.64996337890625, -74.52285766601562, -67.39573669433594, -60.26862335205078, -53.14151382446289, -46.014400482177734, -38.887290954589844, -31.760177612304688, -24.63306427001953, -17.50595474243164, -10.37884521484375, -3.2517333030700684, 3.8753786087036133, 11.002490997314453, 18.129602432250977, 25.2567138671875, 32.383827209472656, 39.51093673706055, 46.6380500793457, 53.76516342163086, 60.89227294921875, 68.0193862915039, 75.14649963378906, 82.27360534667969, 89.40072631835938, 96.52783203125, 103.65494537353516]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 4.0, 7.0, 8.0, 9.0, 10.0, 10.0, 13.0, 10.0, 17.0, 20.0, 25.0, 28.0, 29.0, 30.0, 26.0, 39.0, 34.0, 27.0, 45.0, 40.0, 44.0, 36.0, 55.0, 39.0, 45.0, 40.0, 30.0, 38.0, 28.0, 30.0, 21.0, 22.0, 19.0, 26.0, 21.0, 10.0, 11.0, 8.0, 9.0, 12.0, 9.0, 4.0, 8.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-37.92347717285156, -36.63508987426758, -35.34669876098633, -34.058311462402344, -32.769920349121094, -31.48153305053711, -30.193143844604492, -28.904754638671875, -27.616365432739258, -26.32797622680664, -25.039587020874023, -23.751197814941406, -22.462810516357422, -21.174419403076172, -19.886032104492188, -18.59764289855957, -17.309253692626953, -16.020864486694336, -14.732475280761719, -13.444087028503418, -12.1556978225708, -10.867308616638184, -9.578920364379883, -8.290531158447266, -7.002141952514648, -5.713752746582031, -4.425364017486572, -3.136975049972534, -1.848586082458496, -0.5601968765258789, 0.7281918525695801, 2.016580581665039, 3.3049697875976562, 4.593358993530273, 5.881747722625732, 7.170136451721191, 8.458525657653809, 9.746914863586426, 11.035303115844727, 12.323692321777344, 13.612081527709961, 14.900470733642578, 16.188859939575195, 17.477249145507812, 18.765636444091797, 20.054027557373047, 21.34241485595703, 22.63080406188965, 23.919193267822266, 25.207582473754883, 26.4959716796875, 27.784360885620117, 29.072750091552734, 30.36113739013672, 31.649526596069336, 32.93791580200195, 34.22630310058594, 35.51469039916992, 36.80308151245117, 38.091468811035156, 39.379859924316406, 40.66824722290039, 41.95663833618164, 43.245025634765625, 44.533416748046875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 8.0, 8.0, 12.0, 7.0, 7.0, 14.0, 14.0, 12.0, 18.0, 21.0, 30.0, 23.0, 32.0, 40.0, 45.0, 33.0, 41.0, 36.0, 49.0, 36.0, 47.0, 43.0, 50.0, 38.0, 37.0, 36.0, 40.0, 36.0, 20.0, 28.0, 21.0, 25.0, 17.0, 19.0, 8.0, 11.0, 8.0, 12.0, 3.0, 5.0, 4.0, 7.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-9.9375, -9.6617431640625, -9.385986328125, -9.1102294921875, -8.83447265625, -8.5587158203125, -8.282958984375, -8.0072021484375, -7.7314453125, -7.4556884765625, -7.179931640625, -6.9041748046875, -6.62841796875, -6.3526611328125, -6.076904296875, -5.8011474609375, -5.525390625, -5.2496337890625, -4.973876953125, -4.6981201171875, -4.42236328125, -4.1466064453125, -3.870849609375, -3.5950927734375, -3.3193359375, -3.0435791015625, -2.767822265625, -2.4920654296875, -2.21630859375, -1.9405517578125, -1.664794921875, -1.3890380859375, -1.11328125, -0.8375244140625, -0.561767578125, -0.2860107421875, -0.01025390625, 0.2655029296875, 0.541259765625, 0.8170166015625, 1.0927734375, 1.3685302734375, 1.644287109375, 1.9200439453125, 2.19580078125, 2.4715576171875, 2.747314453125, 3.0230712890625, 3.298828125, 3.5745849609375, 3.850341796875, 4.1260986328125, 4.40185546875, 4.6776123046875, 4.953369140625, 5.2291259765625, 5.5048828125, 5.7806396484375, 6.056396484375, 6.3321533203125, 6.60791015625, 6.8836669921875, 7.159423828125, 7.4351806640625, 7.7109375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 7.0, 9.0, 11.0, 25.0, 26.0, 40.0, 69.0, 98.0, 163.0, 261.0, 343.0, 520.0, 764.0, 1135.0, 1702.0, 2519.0, 3704.0, 5661.0, 8427.0, 12864.0, 19767.0, 31008.0, 48648.0, 78031.0, 121896.0, 169559.0, 174708.0, 131524.0, 85319.0, 52986.0, 33775.0, 21298.0, 14158.0, 9106.0, 6143.0, 4048.0, 2769.0, 1780.0, 1214.0, 832.0, 544.0, 412.0, 236.0, 165.0, 104.0, 64.0, 49.0, 21.0, 27.0, 10.0, 8.0, 4.0, 1.0, 3.0], "bins": [-0.779296875, -0.7577056884765625, -0.736114501953125, -0.7145233154296875, -0.69293212890625, -0.6713409423828125, -0.649749755859375, -0.6281585693359375, -0.6065673828125, -0.5849761962890625, -0.563385009765625, -0.5417938232421875, -0.52020263671875, -0.4986114501953125, -0.477020263671875, -0.4554290771484375, -0.433837890625, -0.4122467041015625, -0.390655517578125, -0.3690643310546875, -0.34747314453125, -0.3258819580078125, -0.304290771484375, -0.2826995849609375, -0.2611083984375, -0.2395172119140625, -0.217926025390625, -0.1963348388671875, -0.17474365234375, -0.1531524658203125, -0.131561279296875, -0.1099700927734375, -0.08837890625, -0.0667877197265625, -0.045196533203125, -0.0236053466796875, -0.00201416015625, 0.0195770263671875, 0.041168212890625, 0.0627593994140625, 0.0843505859375, 0.1059417724609375, 0.127532958984375, 0.1491241455078125, 0.17071533203125, 0.1923065185546875, 0.213897705078125, 0.2354888916015625, 0.257080078125, 0.2786712646484375, 0.300262451171875, 0.3218536376953125, 0.34344482421875, 0.3650360107421875, 0.386627197265625, 0.4082183837890625, 0.4298095703125, 0.4514007568359375, 0.472991943359375, 0.4945831298828125, 0.51617431640625, 0.5377655029296875, 0.559356689453125, 0.5809478759765625, 0.6025390625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 8.0, 7.0, 10.0, 11.0, 14.0, 16.0, 23.0, 24.0, 21.0, 35.0, 28.0, 35.0, 42.0, 33.0, 47.0, 34.0, 34.0, 33.0, 39.0, 1075.0, 52.0, 37.0, 33.0, 37.0, 33.0, 28.0, 34.0, 22.0, 33.0, 23.0, 18.0, 25.0, 14.0, 11.0, 13.0, 8.0, 7.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0], "bins": [-5.69140625, -5.5263671875, -5.361328125, -5.1962890625, -5.03125, -4.8662109375, -4.701171875, -4.5361328125, -4.37109375, -4.2060546875, -4.041015625, -3.8759765625, -3.7109375, -3.5458984375, -3.380859375, -3.2158203125, -3.05078125, -2.8857421875, -2.720703125, -2.5556640625, -2.390625, -2.2255859375, -2.060546875, -1.8955078125, -1.73046875, -1.5654296875, -1.400390625, -1.2353515625, -1.0703125, -0.9052734375, -0.740234375, -0.5751953125, -0.41015625, -0.2451171875, -0.080078125, 0.0849609375, 0.25, 0.4150390625, 0.580078125, 0.7451171875, 0.91015625, 1.0751953125, 1.240234375, 1.4052734375, 1.5703125, 1.7353515625, 1.900390625, 2.0654296875, 2.23046875, 2.3955078125, 2.560546875, 2.7255859375, 2.890625, 3.0556640625, 3.220703125, 3.3857421875, 3.55078125, 3.7158203125, 3.880859375, 4.0458984375, 4.2109375, 4.3759765625, 4.541015625, 4.7060546875, 4.87109375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 8.0, 2.0, 5.0, 6.0, 8.0, 9.0, 15.0, 23.0, 30.0, 45.0, 94.0, 111.0, 173.0, 274.0, 448.0, 644.0, 1010.0, 1592.0, 2666.0, 4176.0, 6750.0, 11213.0, 19230.0, 33698.0, 59110.0, 104298.0, 170511.0, 1262386.0, 171240.0, 104959.0, 59964.0, 33865.0, 19300.0, 11247.0, 6790.0, 3983.0, 2710.0, 1642.0, 1015.0, 671.0, 436.0, 276.0, 163.0, 136.0, 69.0, 51.0, 27.0, 35.0, 7.0, 12.0, 8.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6943359375, -0.6699752807617188, -0.6456146240234375, -0.6212539672851562, -0.596893310546875, -0.5725326538085938, -0.5481719970703125, -0.5238113403320312, -0.49945068359375, -0.47509002685546875, -0.4507293701171875, -0.42636871337890625, -0.402008056640625, -0.37764739990234375, -0.3532867431640625, -0.32892608642578125, -0.3045654296875, -0.28020477294921875, -0.2558441162109375, -0.23148345947265625, -0.207122802734375, -0.18276214599609375, -0.1584014892578125, -0.13404083251953125, -0.10968017578125, -0.08531951904296875, -0.0609588623046875, -0.03659820556640625, -0.012237548828125, 0.01212310791015625, 0.0364837646484375, 0.06084442138671875, 0.085205078125, 0.10956573486328125, 0.1339263916015625, 0.15828704833984375, 0.182647705078125, 0.20700836181640625, 0.2313690185546875, 0.25572967529296875, 0.28009033203125, 0.30445098876953125, 0.3288116455078125, 0.35317230224609375, 0.377532958984375, 0.40189361572265625, 0.4262542724609375, 0.45061492919921875, 0.4749755859375, 0.49933624267578125, 0.5236968994140625, 0.5480575561523438, 0.572418212890625, 0.5967788696289062, 0.6211395263671875, 0.6455001831054688, 0.66986083984375, 0.6942214965820312, 0.7185821533203125, 0.7429428100585938, 0.767303466796875, 0.7916641235351562, 0.8160247802734375, 0.8403854370117188, 0.86474609375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 5.0, 6.0, 4.0, 4.0, 12.0, 12.0, 15.0, 13.0, 21.0, 22.0, 28.0, 35.0, 33.0, 35.0, 39.0, 36.0, 44.0, 50.0, 59.0, 67.0, 53.0, 55.0, 37.0, 48.0, 33.0, 46.0, 31.0, 20.0, 20.0, 23.0, 21.0, 18.0, 12.0, 13.0, 10.0, 12.0, 1.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0021209716796875, -0.002055138349533081, -0.001989305019378662, -0.0019234716892242432, -0.0018576383590698242, -0.0017918050289154053, -0.0017259716987609863, -0.0016601383686065674, -0.0015943050384521484, -0.0015284717082977295, -0.0014626383781433105, -0.0013968050479888916, -0.0013309717178344727, -0.0012651383876800537, -0.0011993050575256348, -0.0011334717273712158, -0.0010676383972167969, -0.001001805067062378, -0.000935971736907959, -0.00087013840675354, -0.0008043050765991211, -0.0007384717464447021, -0.0006726384162902832, -0.0006068050861358643, -0.0005409717559814453, -0.00047513842582702637, -0.0004093050956726074, -0.0003434717655181885, -0.00027763843536376953, -0.00021180510520935059, -0.00014597177505493164, -8.01384449005127e-05, -1.430511474609375e-05, 5.1528215408325195e-05, 0.00011736154556274414, 0.00018319487571716309, 0.00024902820587158203, 0.000314861536026001, 0.0003806948661804199, 0.00044652819633483887, 0.0005123615264892578, 0.0005781948566436768, 0.0006440281867980957, 0.0007098615169525146, 0.0007756948471069336, 0.0008415281772613525, 0.0009073615074157715, 0.0009731948375701904, 0.0010390281677246094, 0.0011048614978790283, 0.0011706948280334473, 0.0012365281581878662, 0.0013023614883422852, 0.001368194818496704, 0.001434028148651123, 0.001499861478805542, 0.001565694808959961, 0.0016315281391143799, 0.0016973614692687988, 0.0017631947994232178, 0.0018290281295776367, 0.0018948614597320557, 0.0019606947898864746, 0.0020265281200408936, 0.0020923614501953125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 6.0, 11.0, 9.0, 19.0, 21.0, 23.0, 27.0, 45.0, 34.0, 50.0, 64.0, 62.0, 93.0, 124.0, 234.0, 298.0, 464.0, 688.0, 2090.0, 772029.0, 268637.0, 1431.0, 642.0, 418.0, 279.0, 186.0, 140.0, 77.0, 67.0, 68.0, 39.0, 39.0, 26.0, 29.0, 18.0, 16.0, 9.0, 10.0, 9.0, 8.0, 4.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03790283203125, -0.03671455383300781, -0.035526275634765625, -0.03433799743652344, -0.03314971923828125, -0.03196144104003906, -0.030773162841796875, -0.029584884643554688, -0.0283966064453125, -0.027208328247070312, -0.026020050048828125, -0.024831771850585938, -0.02364349365234375, -0.022455215454101562, -0.021266937255859375, -0.020078659057617188, -0.018890380859375, -0.017702102661132812, -0.016513824462890625, -0.015325546264648438, -0.01413726806640625, -0.012948989868164062, -0.011760711669921875, -0.010572433471679688, -0.0093841552734375, -0.008195877075195312, -0.007007598876953125, -0.0058193206787109375, -0.00463104248046875, -0.0034427642822265625, -0.002254486083984375, -0.0010662078857421875, 0.0001220703125, 0.0013103485107421875, 0.002498626708984375, 0.0036869049072265625, 0.00487518310546875, 0.0060634613037109375, 0.007251739501953125, 0.008440017700195312, 0.0096282958984375, 0.010816574096679688, 0.012004852294921875, 0.013193130493164062, 0.01438140869140625, 0.015569686889648438, 0.016757965087890625, 0.017946243286132812, 0.019134521484375, 0.020322799682617188, 0.021511077880859375, 0.022699356079101562, 0.02388763427734375, 0.025075912475585938, 0.026264190673828125, 0.027452468872070312, 0.0286407470703125, 0.029829025268554688, 0.031017303466796875, 0.03220558166503906, 0.03339385986328125, 0.03458213806152344, 0.035770416259765625, 0.03695869445800781, 0.03814697265625]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 15.0, 98.0, 493.0, 356.0, 47.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.008333198726177216, -0.008133966475725174, -0.007934734225273132, -0.007735501974821091, -0.007536269724369049, -0.0073370374739170074, -0.007137805689126253, -0.0069385734386742115, -0.00673934118822217, -0.006540108937770128, -0.006340876687318087, -0.006141644436866045, -0.005942412652075291, -0.005743180401623249, -0.005543948151171207, -0.005344715900719166, -0.005145483650267124, -0.0049462513998150826, -0.004747019149363041, -0.004547786898910999, -0.004348554648458958, -0.004149322398006916, -0.003950090613216162, -0.00375085836276412, -0.0035516261123120785, -0.003352393861860037, -0.0031531616114079952, -0.0029539295937865973, -0.0027546973433345556, -0.002555465092882514, -0.002356233075261116, -0.0021570008248090744, -0.00195776904001832, -0.0017585367895662785, -0.0015593046555295587, -0.0013600725214928389, -0.0011608402710407972, -0.0009616080205887556, -0.0007623758865520358, -0.000563143752515316, -0.0003639115020632744, -0.00016467930981889367, 3.455288242548704e-05, 0.00023378507466986775, 0.00043301726691424847, 0.0006322495173662901, 0.0008314816514030099, 0.0010307137854397297, 0.0012299460358917713, 0.001429178286343813, 0.0016284104203805327, 0.0018276425544172525, 0.002026874804869294, 0.002226107055321336, 0.0024253390729427338, 0.0026245713233947754, 0.002823803573846817, 0.0030230358242988586, 0.0032222680747509003, 0.0034215000923722982, 0.00362073234282434, 0.0038199645932763815, 0.0040191966108977795, 0.004218428861349821, 0.004417661111801863]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 4.0, 5.0, 2.0, 8.0, 10.0, 14.0, 8.0, 10.0, 16.0, 21.0, 19.0, 21.0, 21.0, 22.0, 42.0, 27.0, 38.0, 44.0, 34.0, 31.0, 44.0, 36.0, 46.0, 37.0, 45.0, 50.0, 30.0, 40.0, 40.0, 39.0, 27.0, 24.0, 17.0, 24.0, 25.0, 19.0, 14.0, 12.0, 10.0, 6.0, 6.0, 6.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.0013255476951599121, -0.0012887725606560707, -0.0012519974261522293, -0.001215222291648388, -0.0011784471571445465, -0.0011416720226407051, -0.0011048968881368637, -0.0010681217536330223, -0.001031346619129181, -0.0009945714846253395, -0.0009577963501214981, -0.0009210212156176567, -0.0008842460811138153, -0.0008474709466099739, -0.0008106958121061325, -0.0007739206776022911, -0.0007371455430984497, -0.0007003704085946083, -0.0006635952740907669, -0.0006268201395869255, -0.0005900450050830841, -0.0005532698705792427, -0.0005164947360754013, -0.0004797196015715599, -0.0004429444670677185, -0.0004061693325638771, -0.0003693941980600357, -0.0003326190635561943, -0.0002958439290523529, -0.0002590687945485115, -0.0002222936600446701, -0.0001855185255408287, -0.0001487433910369873, -0.0001119682565331459, -7.51931220293045e-05, -3.8417987525463104e-05, -1.642853021621704e-06, 3.5132281482219696e-05, 7.19074159860611e-05, 0.0001086825504899025, 0.0001454576849937439, 0.0001822328194975853, 0.0002190079540014267, 0.0002557830885052681, 0.0002925582230091095, 0.0003293333575129509, 0.0003661084920167923, 0.0004028836265206337, 0.0004396587610244751, 0.0004764338955283165, 0.0005132090300321579, 0.0005499841645359993, 0.0005867592990398407, 0.0006235344335436821, 0.0006603095680475235, 0.0006970847025513649, 0.0007338598370552063, 0.0007706349715590477, 0.0008074101060628891, 0.0008441852405667305, 0.0008809603750705719, 0.0009177355095744133, 0.0009545106440782547, 0.000991285778582096, 0.0010280609130859375]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 8.0, 8.0, 12.0, 7.0, 7.0, 14.0, 14.0, 12.0, 18.0, 21.0, 30.0, 24.0, 31.0, 40.0, 45.0, 33.0, 41.0, 36.0, 49.0, 36.0, 47.0, 43.0, 50.0, 38.0, 37.0, 36.0, 40.0, 36.0, 20.0, 28.0, 21.0, 25.0, 17.0, 19.0, 8.0, 11.0, 8.0, 12.0, 3.0, 5.0, 4.0, 7.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0], "bins": [-9.9375, -9.6617431640625, -9.385986328125, -9.1102294921875, -8.83447265625, -8.5587158203125, -8.282958984375, -8.0072021484375, -7.7314453125, -7.4556884765625, -7.179931640625, -6.9041748046875, -6.62841796875, -6.3526611328125, -6.076904296875, -5.8011474609375, -5.525390625, -5.2496337890625, -4.973876953125, -4.6981201171875, -4.42236328125, -4.1466064453125, -3.870849609375, -3.5950927734375, -3.3193359375, -3.0435791015625, -2.767822265625, -2.4920654296875, -2.21630859375, -1.9405517578125, -1.664794921875, -1.3890380859375, -1.11328125, -0.8375244140625, -0.561767578125, -0.2860107421875, -0.01025390625, 0.2655029296875, 0.541259765625, 0.8170166015625, 1.0927734375, 1.3685302734375, 1.644287109375, 1.9200439453125, 2.19580078125, 2.4715576171875, 2.747314453125, 3.0230712890625, 3.298828125, 3.5745849609375, 3.850341796875, 4.1260986328125, 4.40185546875, 4.6776123046875, 4.953369140625, 5.2291259765625, 5.5048828125, 5.7806396484375, 6.056396484375, 6.3321533203125, 6.60791015625, 6.8836669921875, 7.159423828125, 7.4351806640625, 7.7109375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 4.0, 1.0, 7.0, 9.0, 15.0, 15.0, 26.0, 33.0, 50.0, 69.0, 103.0, 152.0, 198.0, 241.0, 304.0, 482.0, 624.0, 863.0, 1193.0, 2099.0, 4799.0, 18421.0, 122084.0, 595023.0, 250434.0, 36207.0, 7377.0, 2635.0, 1483.0, 999.0, 698.0, 513.0, 354.0, 272.0, 236.0, 153.0, 107.0, 75.0, 59.0, 44.0, 39.0, 20.0, 14.0, 7.0, 12.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.140625, -14.647216796875, -14.15380859375, -13.660400390625, -13.1669921875, -12.673583984375, -12.18017578125, -11.686767578125, -11.193359375, -10.699951171875, -10.20654296875, -9.713134765625, -9.2197265625, -8.726318359375, -8.23291015625, -7.739501953125, -7.24609375, -6.752685546875, -6.25927734375, -5.765869140625, -5.2724609375, -4.779052734375, -4.28564453125, -3.792236328125, -3.298828125, -2.805419921875, -2.31201171875, -1.818603515625, -1.3251953125, -0.831787109375, -0.33837890625, 0.155029296875, 0.6484375, 1.141845703125, 1.63525390625, 2.128662109375, 2.6220703125, 3.115478515625, 3.60888671875, 4.102294921875, 4.595703125, 5.089111328125, 5.58251953125, 6.075927734375, 6.5693359375, 7.062744140625, 7.55615234375, 8.049560546875, 8.54296875, 9.036376953125, 9.52978515625, 10.023193359375, 10.5166015625, 11.010009765625, 11.50341796875, 11.996826171875, 12.490234375, 12.983642578125, 13.47705078125, 13.970458984375, 14.4638671875, 14.957275390625, 15.45068359375, 15.944091796875, 16.4375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 7.0, 6.0, 8.0, 7.0, 11.0, 20.0, 21.0, 20.0, 26.0, 41.0, 48.0, 48.0, 41.0, 61.0, 92.0, 242.0, 1619.0, 228.0, 106.0, 73.0, 49.0, 42.0, 45.0, 30.0, 26.0, 22.0, 24.0, 14.0, 19.0, 12.0, 6.0, 14.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-28.1875, -27.36962890625, -26.5517578125, -25.73388671875, -24.916015625, -24.09814453125, -23.2802734375, -22.46240234375, -21.64453125, -20.82666015625, -20.0087890625, -19.19091796875, -18.373046875, -17.55517578125, -16.7373046875, -15.91943359375, -15.1015625, -14.28369140625, -13.4658203125, -12.64794921875, -11.830078125, -11.01220703125, -10.1943359375, -9.37646484375, -8.55859375, -7.74072265625, -6.9228515625, -6.10498046875, -5.287109375, -4.46923828125, -3.6513671875, -2.83349609375, -2.015625, -1.19775390625, -0.3798828125, 0.43798828125, 1.255859375, 2.07373046875, 2.8916015625, 3.70947265625, 4.52734375, 5.34521484375, 6.1630859375, 6.98095703125, 7.798828125, 8.61669921875, 9.4345703125, 10.25244140625, 11.0703125, 11.88818359375, 12.7060546875, 13.52392578125, 14.341796875, 15.15966796875, 15.9775390625, 16.79541015625, 17.61328125, 18.43115234375, 19.2490234375, 20.06689453125, 20.884765625, 21.70263671875, 22.5205078125, 23.33837890625, 24.15625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 8.0, 14.0, 15.0, 19.0, 19.0, 27.0, 42.0, 65.0, 80.0, 118.0, 169.0, 299.0, 584.0, 1456.0, 132198.0, 3006512.0, 2340.0, 721.0, 353.0, 197.0, 133.0, 79.0, 53.0, 47.0, 29.0, 19.0, 18.0, 20.0, 17.0, 8.0, 5.0, 6.0, 7.0, 4.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-68.75, -66.3916015625, -64.033203125, -61.6748046875, -59.31640625, -56.9580078125, -54.599609375, -52.2412109375, -49.8828125, -47.5244140625, -45.166015625, -42.8076171875, -40.44921875, -38.0908203125, -35.732421875, -33.3740234375, -31.015625, -28.6572265625, -26.298828125, -23.9404296875, -21.58203125, -19.2236328125, -16.865234375, -14.5068359375, -12.1484375, -9.7900390625, -7.431640625, -5.0732421875, -2.71484375, -0.3564453125, 2.001953125, 4.3603515625, 6.71875, 9.0771484375, 11.435546875, 13.7939453125, 16.15234375, 18.5107421875, 20.869140625, 23.2275390625, 25.5859375, 27.9443359375, 30.302734375, 32.6611328125, 35.01953125, 37.3779296875, 39.736328125, 42.0947265625, 44.453125, 46.8115234375, 49.169921875, 51.5283203125, 53.88671875, 56.2451171875, 58.603515625, 60.9619140625, 63.3203125, 65.6787109375, 68.037109375, 70.3955078125, 72.75390625, 75.1123046875, 77.470703125, 79.8291015625, 82.1875]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 38.0, 306.0, 541.0, 111.0, 16.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.43982696533203, -121.96460723876953, -117.4893798828125, -113.01416015625, -108.53893280029297, -104.06371307373047, -99.58848571777344, -95.11326599121094, -90.63804626464844, -86.16282653808594, -81.6875991821289, -77.2123794555664, -72.73715209960938, -68.26193237304688, -63.78670883178711, -59.311485290527344, -54.83625793457031, -50.36103439331055, -45.88581085205078, -41.41059112548828, -36.93536376953125, -32.46014404296875, -27.984920501708984, -23.50969696044922, -19.034473419189453, -14.559249877929688, -10.084027290344238, -5.608804702758789, -1.1335811614990234, 3.341642379760742, 7.816864013671875, 12.29208755493164, 16.767303466796875, 21.24252700805664, 25.717750549316406, 30.19297218322754, 34.66819763183594, 39.14341735839844, 43.6186408996582, 48.09386444091797, 52.569087982177734, 57.0443115234375, 61.519535064697266, 65.99475860595703, 70.46997833251953, 74.94520568847656, 79.42042541503906, 83.89564514160156, 88.3708724975586, 92.8460922241211, 97.32131958007812, 101.79653930664062, 106.27176666259766, 110.74698638916016, 115.22221374511719, 119.69743347167969, 124.17265319824219, 128.6478729248047, 133.1230926513672, 137.59832763671875, 142.07354736328125, 146.54876708984375, 151.02398681640625, 155.49920654296875, 159.9744415283203]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 8.0, 7.0, 12.0, 11.0, 10.0, 12.0, 16.0, 17.0, 16.0, 27.0, 24.0, 29.0, 40.0, 50.0, 36.0, 45.0, 49.0, 37.0, 44.0, 49.0, 30.0, 49.0, 35.0, 36.0, 44.0, 38.0, 26.0, 24.0, 33.0, 26.0, 16.0, 10.0, 17.0, 7.0, 23.0, 21.0, 7.0, 7.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-69.66645812988281, -67.56433868408203, -65.46222686767578, -63.360107421875, -61.257991790771484, -59.15587615966797, -57.05375671386719, -54.95164108276367, -52.849525451660156, -50.74740982055664, -48.645294189453125, -46.543174743652344, -44.44105911254883, -42.33894348144531, -40.23682403564453, -38.134708404541016, -36.0325927734375, -33.930477142333984, -31.828359603881836, -29.726242065429688, -27.624126434326172, -25.522010803222656, -23.419893264770508, -21.31777572631836, -19.215660095214844, -17.113544464111328, -15.01142692565918, -12.909310340881348, -10.807193756103516, -8.705077171325684, -6.602960586547852, -4.5008440017700195, -2.3987274169921875, -0.29661083221435547, 1.8055057525634766, 3.9076223373413086, 6.009738922119141, 8.111855506896973, 10.213972091674805, 12.316088676452637, 14.418205261230469, 16.520320892333984, 18.622438430786133, 20.72455596923828, 22.826671600341797, 24.928787231445312, 27.03090476989746, 29.13302230834961, 31.235137939453125, 33.33725357055664, 35.439369201660156, 37.54148864746094, 39.64360427856445, 41.74571990966797, 43.84783935546875, 45.949954986572266, 48.05207061767578, 50.1541862487793, 52.25630187988281, 54.358421325683594, 56.46053695678711, 58.562652587890625, 60.664772033691406, 62.76688766479492, 64.86900329589844]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 4.0, 6.0, 7.0, 6.0, 11.0, 5.0, 13.0, 12.0, 17.0, 13.0, 19.0, 20.0, 32.0, 21.0, 33.0, 44.0, 41.0, 29.0, 36.0, 38.0, 41.0, 56.0, 37.0, 45.0, 37.0, 42.0, 39.0, 36.0, 24.0, 34.0, 34.0, 25.0, 15.0, 27.0, 14.0, 18.0, 18.0, 9.0, 12.0, 7.0, 4.0, 6.0, 8.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-9.7109375, -9.44049072265625, -9.1700439453125, -8.89959716796875, -8.629150390625, -8.35870361328125, -8.0882568359375, -7.81781005859375, -7.54736328125, -7.27691650390625, -7.0064697265625, -6.73602294921875, -6.465576171875, -6.19512939453125, -5.9246826171875, -5.65423583984375, -5.3837890625, -5.11334228515625, -4.8428955078125, -4.57244873046875, -4.302001953125, -4.03155517578125, -3.7611083984375, -3.49066162109375, -3.22021484375, -2.94976806640625, -2.6793212890625, -2.40887451171875, -2.138427734375, -1.86798095703125, -1.5975341796875, -1.32708740234375, -1.056640625, -0.78619384765625, -0.5157470703125, -0.24530029296875, 0.025146484375, 0.29559326171875, 0.5660400390625, 0.83648681640625, 1.10693359375, 1.37738037109375, 1.6478271484375, 1.91827392578125, 2.188720703125, 2.45916748046875, 2.7296142578125, 3.00006103515625, 3.2705078125, 3.54095458984375, 3.8114013671875, 4.08184814453125, 4.352294921875, 4.62274169921875, 4.8931884765625, 5.16363525390625, 5.43408203125, 5.70452880859375, 5.9749755859375, 6.24542236328125, 6.515869140625, 6.78631591796875, 7.0567626953125, 7.32720947265625, 7.59765625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 9.0, 2.0, 8.0, 11.0, 20.0, 9.0, 29.0, 28.0, 34.0, 46.0, 60.0, 61.0, 74.0, 91.0, 123.0, 177.0, 266.0, 507.0, 1044.0, 2794.0, 10288.0, 79171.0, 1047261.0, 2610108.0, 398757.0, 33436.0, 5928.0, 1807.0, 797.0, 391.0, 220.0, 159.0, 113.0, 95.0, 75.0, 74.0, 41.0, 36.0, 37.0, 21.0, 21.0, 20.0, 9.0, 8.0, 6.0, 5.0, 2.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-19.75, -19.156982421875, -18.56396484375, -17.970947265625, -17.3779296875, -16.784912109375, -16.19189453125, -15.598876953125, -15.005859375, -14.412841796875, -13.81982421875, -13.226806640625, -12.6337890625, -12.040771484375, -11.44775390625, -10.854736328125, -10.26171875, -9.668701171875, -9.07568359375, -8.482666015625, -7.8896484375, -7.296630859375, -6.70361328125, -6.110595703125, -5.517578125, -4.924560546875, -4.33154296875, -3.738525390625, -3.1455078125, -2.552490234375, -1.95947265625, -1.366455078125, -0.7734375, -0.180419921875, 0.41259765625, 1.005615234375, 1.5986328125, 2.191650390625, 2.78466796875, 3.377685546875, 3.970703125, 4.563720703125, 5.15673828125, 5.749755859375, 6.3427734375, 6.935791015625, 7.52880859375, 8.121826171875, 8.71484375, 9.307861328125, 9.90087890625, 10.493896484375, 11.0869140625, 11.679931640625, 12.27294921875, 12.865966796875, 13.458984375, 14.052001953125, 14.64501953125, 15.238037109375, 15.8310546875, 16.424072265625, 17.01708984375, 17.610107421875, 18.203125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 4.0, 12.0, 12.0, 16.0, 26.0, 24.0, 36.0, 33.0, 46.0, 69.0, 79.0, 105.0, 125.0, 173.0, 220.0, 336.0, 449.0, 524.0, 473.0, 327.0, 257.0, 180.0, 119.0, 92.0, 78.0, 49.0, 52.0, 34.0, 27.0, 24.0, 12.0, 20.0, 10.0, 4.0, 10.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.96875, -15.5318603515625, -15.094970703125, -14.6580810546875, -14.22119140625, -13.7843017578125, -13.347412109375, -12.9105224609375, -12.4736328125, -12.0367431640625, -11.599853515625, -11.1629638671875, -10.72607421875, -10.2891845703125, -9.852294921875, -9.4154052734375, -8.978515625, -8.5416259765625, -8.104736328125, -7.6678466796875, -7.23095703125, -6.7940673828125, -6.357177734375, -5.9202880859375, -5.4833984375, -5.0465087890625, -4.609619140625, -4.1727294921875, -3.73583984375, -3.2989501953125, -2.862060546875, -2.4251708984375, -1.98828125, -1.5513916015625, -1.114501953125, -0.6776123046875, -0.24072265625, 0.1961669921875, 0.633056640625, 1.0699462890625, 1.5068359375, 1.9437255859375, 2.380615234375, 2.8175048828125, 3.25439453125, 3.6912841796875, 4.128173828125, 4.5650634765625, 5.001953125, 5.4388427734375, 5.875732421875, 6.3126220703125, 6.74951171875, 7.1864013671875, 7.623291015625, 8.0601806640625, 8.4970703125, 8.9339599609375, 9.370849609375, 9.8077392578125, 10.24462890625, 10.6815185546875, 11.118408203125, 11.5552978515625, 11.9921875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 8.0, 8.0, 13.0, 21.0, 41.0, 55.0, 125.0, 223.0, 513.0, 1362.0, 8255.0, 741431.0, 3417128.0, 21618.0, 2054.0, 736.0, 266.0, 190.0, 99.0, 50.0, 37.0, 20.0, 13.0, 12.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.1875, -65.63037109375, -64.0732421875, -62.51611328125, -60.958984375, -59.40185546875, -57.8447265625, -56.28759765625, -54.73046875, -53.17333984375, -51.6162109375, -50.05908203125, -48.501953125, -46.94482421875, -45.3876953125, -43.83056640625, -42.2734375, -40.71630859375, -39.1591796875, -37.60205078125, -36.044921875, -34.48779296875, -32.9306640625, -31.37353515625, -29.81640625, -28.25927734375, -26.7021484375, -25.14501953125, -23.587890625, -22.03076171875, -20.4736328125, -18.91650390625, -17.359375, -15.80224609375, -14.2451171875, -12.68798828125, -11.130859375, -9.57373046875, -8.0166015625, -6.45947265625, -4.90234375, -3.34521484375, -1.7880859375, -0.23095703125, 1.326171875, 2.88330078125, 4.4404296875, 5.99755859375, 7.5546875, 9.11181640625, 10.6689453125, 12.22607421875, 13.783203125, 15.34033203125, 16.8974609375, 18.45458984375, 20.01171875, 21.56884765625, 23.1259765625, 24.68310546875, 26.240234375, 27.79736328125, 29.3544921875, 30.91162109375, 32.46875]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 8.0, 16.0, 39.0, 88.0, 149.0, 197.0, 189.0, 174.0, 89.0, 33.0, 17.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-86.7997817993164, -84.00353240966797, -81.20729064941406, -78.41104125976562, -75.61479949951172, -72.81855010986328, -70.02230834960938, -67.22605895996094, -64.4298095703125, -61.63356399536133, -58.837318420410156, -56.04106903076172, -53.24482727050781, -50.448577880859375, -47.6523323059082, -44.85608673095703, -42.059844970703125, -39.26359939575195, -36.46735382080078, -33.671104431152344, -30.874860763549805, -28.078615188598633, -25.282367706298828, -22.486122131347656, -19.689876556396484, -16.893630981445312, -14.097384452819824, -11.301137924194336, -8.504892349243164, -5.708646774291992, -2.9123992919921875, -0.11615371704101562, 2.680084228515625, 5.476330280303955, 8.272576332092285, 11.068822860717773, 13.865068435668945, 16.661314010620117, 19.457561492919922, 22.253807067871094, 25.050052642822266, 27.846298217773438, 30.64254379272461, 33.43878936767578, 36.23503875732422, 39.031280517578125, 41.82752990722656, 44.623775482177734, 47.420021057128906, 50.21626663208008, 53.01251220703125, 55.80876159667969, 58.605003356933594, 61.40125274658203, 64.19749450683594, 66.99374389648438, 69.78999328613281, 72.58624267578125, 75.38248443603516, 78.1787338256836, 80.9749755859375, 83.77122497558594, 86.56747436523438, 89.36371612548828, 92.15995788574219]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 6.0, 8.0, 6.0, 9.0, 13.0, 13.0, 18.0, 18.0, 14.0, 19.0, 23.0, 24.0, 30.0, 36.0, 24.0, 34.0, 41.0, 32.0, 46.0, 46.0, 35.0, 35.0, 45.0, 47.0, 45.0, 41.0, 33.0, 32.0, 34.0, 26.0, 18.0, 18.0, 26.0, 17.0, 12.0, 11.0, 12.0, 17.0, 10.0, 6.0, 9.0, 4.0, 4.0, 0.0, 6.0, 3.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.05509948730469, -56.32782745361328, -54.60055160522461, -52.8732795715332, -51.14600372314453, -49.418731689453125, -47.69145965576172, -45.96418380737305, -44.236907958984375, -42.50963592529297, -40.7823600769043, -39.05508804321289, -37.32781219482422, -35.60054016113281, -33.873268127441406, -32.145992279052734, -30.418720245361328, -28.69144630432129, -26.96417236328125, -25.236900329589844, -23.509624481201172, -21.782352447509766, -20.055078506469727, -18.327804565429688, -16.60053062438965, -14.87325668334961, -13.14598274230957, -11.418709754943848, -9.691435813903809, -7.9641618728637695, -6.236888885498047, -4.509614944458008, -2.7823410034179688, -1.0550673007965088, 0.6722064018249512, 2.399479866027832, 4.126753807067871, 5.85402774810791, 7.581300735473633, 9.308574676513672, 11.035848617553711, 12.76312255859375, 14.490396499633789, 16.217670440673828, 17.944942474365234, 19.672218322753906, 21.399490356445312, 23.12676429748535, 24.85403823852539, 26.58131217956543, 28.30858612060547, 30.035858154296875, 31.763134002685547, 33.49040603637695, 35.217681884765625, 36.94495391845703, 38.67222595214844, 40.399497985839844, 42.126773834228516, 43.85404586791992, 45.581321716308594, 47.30859375, 49.035865783691406, 50.76314163208008, 52.49041748046875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 6.0, 4.0, 7.0, 12.0, 12.0, 14.0, 11.0, 22.0, 17.0, 24.0, 30.0, 30.0, 34.0, 34.0, 39.0, 39.0, 42.0, 51.0, 46.0, 49.0, 49.0, 34.0, 44.0, 38.0, 41.0, 44.0, 30.0, 28.0, 20.0, 32.0, 22.0, 23.0, 12.0, 6.0, 17.0, 6.0, 3.0, 3.0, 5.0, 3.0, 4.0, 8.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.41796875, -6.207275390625, -5.99658203125, -5.785888671875, -5.5751953125, -5.364501953125, -5.15380859375, -4.943115234375, -4.732421875, -4.521728515625, -4.31103515625, -4.100341796875, -3.8896484375, -3.678955078125, -3.46826171875, -3.257568359375, -3.046875, -2.836181640625, -2.62548828125, -2.414794921875, -2.2041015625, -1.993408203125, -1.78271484375, -1.572021484375, -1.361328125, -1.150634765625, -0.93994140625, -0.729248046875, -0.5185546875, -0.307861328125, -0.09716796875, 0.113525390625, 0.32421875, 0.534912109375, 0.74560546875, 0.956298828125, 1.1669921875, 1.377685546875, 1.58837890625, 1.799072265625, 2.009765625, 2.220458984375, 2.43115234375, 2.641845703125, 2.8525390625, 3.063232421875, 3.27392578125, 3.484619140625, 3.6953125, 3.906005859375, 4.11669921875, 4.327392578125, 4.5380859375, 4.748779296875, 4.95947265625, 5.170166015625, 5.380859375, 5.591552734375, 5.80224609375, 6.012939453125, 6.2236328125, 6.434326171875, 6.64501953125, 6.855712890625, 7.06640625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 4.0, 2.0, 7.0, 9.0, 4.0, 24.0, 28.0, 51.0, 50.0, 97.0, 130.0, 182.0, 278.0, 393.0, 677.0, 825.0, 1260.0, 2011.0, 2894.0, 4275.0, 6421.0, 9396.0, 14332.0, 22033.0, 35413.0, 58630.0, 100779.0, 166763.0, 208553.0, 161565.0, 97078.0, 56903.0, 34185.0, 21569.0, 13926.0, 9046.0, 6195.0, 3941.0, 2774.0, 1811.0, 1251.0, 902.0, 601.0, 399.0, 299.0, 195.0, 121.0, 99.0, 62.0, 39.0, 24.0, 29.0, 9.0, 7.0, 9.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.587890625, -0.5692062377929688, -0.5505218505859375, -0.5318374633789062, -0.513153076171875, -0.49446868896484375, -0.4757843017578125, -0.45709991455078125, -0.43841552734375, -0.41973114013671875, -0.4010467529296875, -0.38236236572265625, -0.363677978515625, -0.34499359130859375, -0.3263092041015625, -0.30762481689453125, -0.2889404296875, -0.27025604248046875, -0.2515716552734375, -0.23288726806640625, -0.214202880859375, -0.19551849365234375, -0.1768341064453125, -0.15814971923828125, -0.13946533203125, -0.12078094482421875, -0.1020965576171875, -0.08341217041015625, -0.064727783203125, -0.04604339599609375, -0.0273590087890625, -0.00867462158203125, 0.010009765625, 0.02869415283203125, 0.0473785400390625, 0.06606292724609375, 0.084747314453125, 0.10343170166015625, 0.1221160888671875, 0.14080047607421875, 0.15948486328125, 0.17816925048828125, 0.1968536376953125, 0.21553802490234375, 0.234222412109375, 0.25290679931640625, 0.2715911865234375, 0.29027557373046875, 0.3089599609375, 0.32764434814453125, 0.3463287353515625, 0.36501312255859375, 0.383697509765625, 0.40238189697265625, 0.4210662841796875, 0.43975067138671875, 0.45843505859375, 0.47711944580078125, 0.4958038330078125, 0.5144882202148438, 0.533172607421875, 0.5518569946289062, 0.5705413818359375, 0.5892257690429688, 0.60791015625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 6.0, 5.0, 8.0, 7.0, 4.0, 6.0, 11.0, 6.0, 19.0, 21.0, 13.0, 18.0, 27.0, 31.0, 40.0, 29.0, 27.0, 37.0, 32.0, 41.0, 40.0, 41.0, 37.0, 1061.0, 46.0, 45.0, 41.0, 33.0, 34.0, 22.0, 28.0, 20.0, 32.0, 29.0, 27.0, 17.0, 8.0, 14.0, 12.0, 7.0, 9.0, 10.0, 12.0, 5.0, 1.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.638671875, -3.513336181640625, -3.38800048828125, -3.262664794921875, -3.1373291015625, -3.011993408203125, -2.88665771484375, -2.761322021484375, -2.635986328125, -2.510650634765625, -2.38531494140625, -2.259979248046875, -2.1346435546875, -2.009307861328125, -1.88397216796875, -1.758636474609375, -1.63330078125, -1.507965087890625, -1.38262939453125, -1.257293701171875, -1.1319580078125, -1.006622314453125, -0.88128662109375, -0.755950927734375, -0.630615234375, -0.505279541015625, -0.37994384765625, -0.254608154296875, -0.1292724609375, -0.003936767578125, 0.12139892578125, 0.246734619140625, 0.3720703125, 0.497406005859375, 0.62274169921875, 0.748077392578125, 0.8734130859375, 0.998748779296875, 1.12408447265625, 1.249420166015625, 1.374755859375, 1.500091552734375, 1.62542724609375, 1.750762939453125, 1.8760986328125, 2.001434326171875, 2.12677001953125, 2.252105712890625, 2.37744140625, 2.502777099609375, 2.62811279296875, 2.753448486328125, 2.8787841796875, 3.004119873046875, 3.12945556640625, 3.254791259765625, 3.380126953125, 3.505462646484375, 3.63079833984375, 3.756134033203125, 3.8814697265625, 4.006805419921875, 4.13214111328125, 4.257476806640625, 4.3828125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 7.0, 5.0, 12.0, 25.0, 35.0, 59.0, 78.0, 119.0, 191.0, 342.0, 589.0, 916.0, 1710.0, 2957.0, 4991.0, 8835.0, 15831.0, 28187.0, 51953.0, 97323.0, 172863.0, 1282245.0, 188273.0, 108875.0, 58476.0, 31445.0, 17703.0, 9919.0, 5491.0, 3143.0, 1823.0, 1055.0, 609.0, 401.0, 233.0, 152.0, 97.0, 57.0, 38.0, 25.0, 14.0, 5.0, 11.0, 7.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6416015625, -0.6199188232421875, -0.598236083984375, -0.5765533447265625, -0.55487060546875, -0.5331878662109375, -0.511505126953125, -0.4898223876953125, -0.4681396484375, -0.4464569091796875, -0.424774169921875, -0.4030914306640625, -0.38140869140625, -0.3597259521484375, -0.338043212890625, -0.3163604736328125, -0.294677734375, -0.2729949951171875, -0.251312255859375, -0.2296295166015625, -0.20794677734375, -0.1862640380859375, -0.164581298828125, -0.1428985595703125, -0.1212158203125, -0.0995330810546875, -0.077850341796875, -0.0561676025390625, -0.03448486328125, -0.0128021240234375, 0.008880615234375, 0.0305633544921875, 0.05224609375, 0.0739288330078125, 0.095611572265625, 0.1172943115234375, 0.13897705078125, 0.1606597900390625, 0.182342529296875, 0.2040252685546875, 0.2257080078125, 0.2473907470703125, 0.269073486328125, 0.2907562255859375, 0.31243896484375, 0.3341217041015625, 0.355804443359375, 0.3774871826171875, 0.399169921875, 0.4208526611328125, 0.442535400390625, 0.4642181396484375, 0.48590087890625, 0.5075836181640625, 0.529266357421875, 0.5509490966796875, 0.5726318359375, 0.5943145751953125, 0.615997314453125, 0.6376800537109375, 0.65936279296875, 0.6810455322265625, 0.702728271484375, 0.7244110107421875, 0.74609375]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 4.0, 4.0, 7.0, 11.0, 11.0, 12.0, 19.0, 25.0, 22.0, 29.0, 40.0, 41.0, 37.0, 51.0, 45.0, 54.0, 64.0, 58.0, 51.0, 65.0, 52.0, 64.0, 43.0, 35.0, 28.0, 29.0, 17.0, 16.0, 8.0, 13.0, 14.0, 3.0, 7.0, 7.0, 0.0, 4.0, 1.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0019855499267578125, -0.001920849084854126, -0.0018561482429504395, -0.001791447401046753, -0.0017267465591430664, -0.0016620457172393799, -0.0015973448753356934, -0.0015326440334320068, -0.0014679431915283203, -0.0014032423496246338, -0.0013385415077209473, -0.0012738406658172607, -0.0012091398239135742, -0.0011444389820098877, -0.0010797381401062012, -0.0010150372982025146, -0.0009503364562988281, -0.0008856356143951416, -0.0008209347724914551, -0.0007562339305877686, -0.000691533088684082, -0.0006268322467803955, -0.000562131404876709, -0.0004974305629730225, -0.00043272972106933594, -0.0003680288791656494, -0.0003033280372619629, -0.00023862719535827637, -0.00017392635345458984, -0.00010922551155090332, -4.45246696472168e-05, 2.0176172256469727e-05, 8.487701416015625e-05, 0.00014957785606384277, 0.0002142786979675293, 0.0002789795398712158, 0.00034368038177490234, 0.00040838122367858887, 0.0004730820655822754, 0.0005377829074859619, 0.0006024837493896484, 0.000667184591293335, 0.0007318854331970215, 0.000796586275100708, 0.0008612871170043945, 0.0009259879589080811, 0.0009906888008117676, 0.001055389642715454, 0.0011200904846191406, 0.0011847913265228271, 0.0012494921684265137, 0.0013141930103302002, 0.0013788938522338867, 0.0014435946941375732, 0.0015082955360412598, 0.0015729963779449463, 0.0016376972198486328, 0.0017023980617523193, 0.0017670989036560059, 0.0018317997455596924, 0.001896500587463379, 0.0019612014293670654, 0.002025902271270752, 0.0020906031131744385, 0.002155303955078125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 1.0, 9.0, 12.0, 16.0, 15.0, 23.0, 35.0, 40.0, 47.0, 76.0, 100.0, 134.0, 217.0, 393.0, 635.0, 1467.0, 763501.0, 278757.0, 1197.0, 638.0, 390.0, 215.0, 150.0, 104.0, 74.0, 67.0, 58.0, 49.0, 34.0, 18.0, 17.0, 13.0, 6.0, 7.0, 8.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.04193115234375, -0.040617942810058594, -0.03930473327636719, -0.03799152374267578, -0.036678314208984375, -0.03536510467529297, -0.03405189514160156, -0.032738685607910156, -0.03142547607421875, -0.030112266540527344, -0.028799057006835938, -0.02748584747314453, -0.026172637939453125, -0.02485942840576172, -0.023546218872070312, -0.022233009338378906, -0.0209197998046875, -0.019606590270996094, -0.018293380737304688, -0.01698017120361328, -0.015666961669921875, -0.014353752136230469, -0.013040542602539062, -0.011727333068847656, -0.01041412353515625, -0.009100914001464844, -0.0077877044677734375, -0.006474494934082031, -0.005161285400390625, -0.0038480758666992188, -0.0025348663330078125, -0.0012216567993164062, 9.1552734375e-05, 0.0014047622680664062, 0.0027179718017578125, 0.004031181335449219, 0.005344390869140625, 0.006657600402832031, 0.007970809936523438, 0.009284019470214844, 0.01059722900390625, 0.011910438537597656, 0.013223648071289062, 0.014536857604980469, 0.015850067138671875, 0.01716327667236328, 0.018476486206054688, 0.019789695739746094, 0.0211029052734375, 0.022416114807128906, 0.023729324340820312, 0.02504253387451172, 0.026355743408203125, 0.02766895294189453, 0.028982162475585938, 0.030295372009277344, 0.03160858154296875, 0.032921791076660156, 0.03423500061035156, 0.03554821014404297, 0.036861419677734375, 0.03817462921142578, 0.03948783874511719, 0.040801048278808594, 0.0421142578125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [6.0, 153.0, 723.0, 129.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005555703537538648, -0.0003293518384452909, -0.00010313332313671708, 0.00012308522127568722, 0.0003493037074804306, 0.000575522193685174, 0.0008017407963052392, 0.0010279592825099826, 0.001254177768714726, 0.0014803962549194694, 0.0017066148575395346, 0.001932833343744278, 0.0021590518299490213, 0.0023852703161537647, 0.0026114890351891518, 0.0028377072885632515, 0.0030639260075986385, 0.003290144493803382, 0.0035163629800081253, 0.0037425816990435123, 0.003968799952417612, 0.004195018671452999, 0.004421236924827099, 0.004647455643862486, 0.004873673897236586, 0.005099892616271973, 0.005326110869646072, 0.005552329588681459, 0.005778547842055559, 0.006004766561090946, 0.006230984814465046, 0.006457203533500433, 0.00668342225253582, 0.006909640971571207, 0.007135859224945307, 0.007362077943980694, 0.0075882961973547935, 0.007814514450728893, 0.008040733635425568, 0.008266951888799667, 0.008493170142173767, 0.008719388395547867, 0.008945607580244541, 0.009171825833618641, 0.00939804408699274, 0.00962426234036684, 0.009850481525063515, 0.010076699778437614, 0.010302918031811714, 0.010529136285185814, 0.010755355469882488, 0.010981573723256588, 0.011207791976630688, 0.011434010230004787, 0.011660229414701462, 0.011886447668075562, 0.012112666852772236, 0.012338885106146336, 0.01256510429084301, 0.01279132254421711, 0.01301754079759121, 0.01324375905096531, 0.013469978235661983, 0.013696196489036083, 0.013922414742410183]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 8.0, 7.0, 4.0, 7.0, 8.0, 17.0, 13.0, 21.0, 12.0, 21.0, 23.0, 17.0, 28.0, 26.0, 25.0, 24.0, 32.0, 42.0, 63.0, 30.0, 31.0, 33.0, 44.0, 45.0, 39.0, 40.0, 24.0, 26.0, 33.0, 27.0, 24.0, 29.0, 22.0, 17.0, 22.0, 22.0, 19.0, 16.0, 11.0, 13.0, 10.0, 3.0, 7.0, 5.0, 2.0, 4.0, 1.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.0009876489639282227, -0.0009566610679030418, -0.000925673171877861, -0.0008946852758526802, -0.0008636973798274994, -0.0008327094838023186, -0.0008017215877771378, -0.0007707336917519569, -0.0007397457957267761, -0.0007087578997015953, -0.0006777700036764145, -0.0006467821076512337, -0.0006157942116260529, -0.000584806315600872, -0.0005538184195756912, -0.0005228305235505104, -0.0004918426275253296, -0.0004608547315001488, -0.00042986683547496796, -0.00039887893944978714, -0.0003678910434246063, -0.0003369031473994255, -0.0003059152513742447, -0.0002749273553490639, -0.00024393945932388306, -0.00021295156329870224, -0.00018196366727352142, -0.0001509757712483406, -0.00011998787522315979, -8.899997919797897e-05, -5.801208317279816e-05, -2.702418714761734e-05, 3.9637088775634766e-06, 3.495160490274429e-05, 6.593950092792511e-05, 9.692739695310593e-05, 0.00012791529297828674, 0.00015890318900346756, 0.00018989108502864838, 0.0002208789810538292, 0.00025186687707901, 0.0002828547731041908, 0.00031384266912937164, 0.00034483056515455246, 0.0003758184611797333, 0.0004068063572049141, 0.0004377942532300949, 0.0004687821492552757, 0.0004997700452804565, 0.0005307579413056374, 0.0005617458373308182, 0.000592733733355999, 0.0006237216293811798, 0.0006547095254063606, 0.0006856974214315414, 0.0007166853174567223, 0.0007476732134819031, 0.0007786611095070839, 0.0008096490055322647, 0.0008406369015574455, 0.0008716247975826263, 0.0009026126936078072, 0.000933600589632988, 0.0009645884856581688, 0.0009955763816833496]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 5.0, 6.0, 4.0, 7.0, 12.0, 12.0, 14.0, 11.0, 22.0, 17.0, 24.0, 30.0, 30.0, 34.0, 34.0, 39.0, 39.0, 42.0, 51.0, 46.0, 49.0, 49.0, 34.0, 44.0, 38.0, 41.0, 44.0, 30.0, 28.0, 20.0, 32.0, 22.0, 23.0, 12.0, 6.0, 17.0, 6.0, 3.0, 3.0, 5.0, 3.0, 4.0, 8.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.41796875, -6.207275390625, -5.99658203125, -5.785888671875, -5.5751953125, -5.364501953125, -5.15380859375, -4.943115234375, -4.732421875, -4.521728515625, -4.31103515625, -4.100341796875, -3.8896484375, -3.678955078125, -3.46826171875, -3.257568359375, -3.046875, -2.836181640625, -2.62548828125, -2.414794921875, -2.2041015625, -1.993408203125, -1.78271484375, -1.572021484375, -1.361328125, -1.150634765625, -0.93994140625, -0.729248046875, -0.5185546875, -0.307861328125, -0.09716796875, 0.113525390625, 0.32421875, 0.534912109375, 0.74560546875, 0.956298828125, 1.1669921875, 1.377685546875, 1.58837890625, 1.799072265625, 2.009765625, 2.220458984375, 2.43115234375, 2.641845703125, 2.8525390625, 3.063232421875, 3.27392578125, 3.484619140625, 3.6953125, 3.906005859375, 4.11669921875, 4.327392578125, 4.5380859375, 4.748779296875, 4.95947265625, 5.170166015625, 5.380859375, 5.591552734375, 5.80224609375, 6.012939453125, 6.2236328125, 6.434326171875, 6.64501953125, 6.855712890625, 7.06640625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 10.0, 8.0, 7.0, 14.0, 20.0, 28.0, 33.0, 48.0, 66.0, 85.0, 137.0, 159.0, 219.0, 311.0, 462.0, 681.0, 1002.0, 1459.0, 2368.0, 4964.0, 15655.0, 104446.0, 690215.0, 188656.0, 23224.0, 6169.0, 2864.0, 1671.0, 1068.0, 693.0, 478.0, 379.0, 298.0, 184.0, 119.0, 94.0, 73.0, 56.0, 25.0, 28.0, 26.0, 22.0, 6.0, 7.0, 7.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-17.296875, -16.782470703125, -16.26806640625, -15.753662109375, -15.2392578125, -14.724853515625, -14.21044921875, -13.696044921875, -13.181640625, -12.667236328125, -12.15283203125, -11.638427734375, -11.1240234375, -10.609619140625, -10.09521484375, -9.580810546875, -9.06640625, -8.552001953125, -8.03759765625, -7.523193359375, -7.0087890625, -6.494384765625, -5.97998046875, -5.465576171875, -4.951171875, -4.436767578125, -3.92236328125, -3.407958984375, -2.8935546875, -2.379150390625, -1.86474609375, -1.350341796875, -0.8359375, -0.321533203125, 0.19287109375, 0.707275390625, 1.2216796875, 1.736083984375, 2.25048828125, 2.764892578125, 3.279296875, 3.793701171875, 4.30810546875, 4.822509765625, 5.3369140625, 5.851318359375, 6.36572265625, 6.880126953125, 7.39453125, 7.908935546875, 8.42333984375, 8.937744140625, 9.4521484375, 9.966552734375, 10.48095703125, 10.995361328125, 11.509765625, 12.024169921875, 12.53857421875, 13.052978515625, 13.5673828125, 14.081787109375, 14.59619140625, 15.110595703125, 15.625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 3.0, 7.0, 6.0, 9.0, 12.0, 8.0, 11.0, 20.0, 13.0, 26.0, 14.0, 26.0, 38.0, 41.0, 41.0, 51.0, 65.0, 96.0, 249.0, 1561.0, 240.0, 96.0, 50.0, 58.0, 51.0, 33.0, 29.0, 29.0, 24.0, 19.0, 14.0, 19.0, 15.0, 12.0, 7.0, 9.0, 7.0, 6.0, 6.0, 6.0, 4.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0], "bins": [-17.328125, -16.8533935546875, -16.378662109375, -15.9039306640625, -15.42919921875, -14.9544677734375, -14.479736328125, -14.0050048828125, -13.5302734375, -13.0555419921875, -12.580810546875, -12.1060791015625, -11.63134765625, -11.1566162109375, -10.681884765625, -10.2071533203125, -9.732421875, -9.2576904296875, -8.782958984375, -8.3082275390625, -7.83349609375, -7.3587646484375, -6.884033203125, -6.4093017578125, -5.9345703125, -5.4598388671875, -4.985107421875, -4.5103759765625, -4.03564453125, -3.5609130859375, -3.086181640625, -2.6114501953125, -2.13671875, -1.6619873046875, -1.187255859375, -0.7125244140625, -0.23779296875, 0.2369384765625, 0.711669921875, 1.1864013671875, 1.6611328125, 2.1358642578125, 2.610595703125, 3.0853271484375, 3.56005859375, 4.0347900390625, 4.509521484375, 4.9842529296875, 5.458984375, 5.9337158203125, 6.408447265625, 6.8831787109375, 7.35791015625, 7.8326416015625, 8.307373046875, 8.7821044921875, 9.2568359375, 9.7315673828125, 10.206298828125, 10.6810302734375, 11.15576171875, 11.6304931640625, 12.105224609375, 12.5799560546875, 13.0546875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 7.0, 4.0, 7.0, 11.0, 15.0, 18.0, 20.0, 33.0, 43.0, 51.0, 83.0, 88.0, 144.0, 213.0, 362.0, 699.0, 1929.0, 817617.0, 2320482.0, 2076.0, 715.0, 317.0, 240.0, 145.0, 94.0, 60.0, 53.0, 43.0, 35.0, 27.0, 23.0, 7.0, 8.0, 13.0, 6.0, 3.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.25, -45.6220703125, -43.994140625, -42.3662109375, -40.73828125, -39.1103515625, -37.482421875, -35.8544921875, -34.2265625, -32.5986328125, -30.970703125, -29.3427734375, -27.71484375, -26.0869140625, -24.458984375, -22.8310546875, -21.203125, -19.5751953125, -17.947265625, -16.3193359375, -14.69140625, -13.0634765625, -11.435546875, -9.8076171875, -8.1796875, -6.5517578125, -4.923828125, -3.2958984375, -1.66796875, -0.0400390625, 1.587890625, 3.2158203125, 4.84375, 6.4716796875, 8.099609375, 9.7275390625, 11.35546875, 12.9833984375, 14.611328125, 16.2392578125, 17.8671875, 19.4951171875, 21.123046875, 22.7509765625, 24.37890625, 26.0068359375, 27.634765625, 29.2626953125, 30.890625, 32.5185546875, 34.146484375, 35.7744140625, 37.40234375, 39.0302734375, 40.658203125, 42.2861328125, 43.9140625, 45.5419921875, 47.169921875, 48.7978515625, 50.42578125, 52.0537109375, 53.681640625, 55.3095703125, 56.9375]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 57.0, 223.0, 416.0, 248.0, 51.0, 10.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-172.0075225830078, -168.85704040527344, -165.70654296875, -162.55606079101562, -159.40557861328125, -156.25509643554688, -153.10459899902344, -149.95411682128906, -146.8036346435547, -143.6531524658203, -140.50265502929688, -137.3521728515625, -134.20169067382812, -131.05120849609375, -127.90071105957031, -124.75022888183594, -121.59973907470703, -118.44924926757812, -115.29876708984375, -112.14827728271484, -108.99779510498047, -105.84730529785156, -102.69682312011719, -99.54633331298828, -96.39584350585938, -93.24535369873047, -90.0948715209961, -86.94438171386719, -83.79389953613281, -80.6434097290039, -77.492919921875, -74.34243774414062, -71.19195556640625, -68.04146575927734, -64.89098358154297, -61.74049377441406, -58.59001159667969, -55.43952178955078, -52.28903579711914, -49.1385498046875, -45.988059997558594, -42.83757400512695, -39.68708801269531, -36.536598205566406, -33.38611602783203, -30.235628128051758, -27.085140228271484, -23.934654235839844, -20.784170150756836, -17.633684158325195, -14.483197212219238, -11.332710266113281, -8.18222427368164, -5.03173828125, -1.8812503814697266, 1.269235610961914, 4.419721603393555, 7.5702080726623535, 10.720694541931152, 13.87118148803711, 17.02166748046875, 20.17215347290039, 23.322641372680664, 26.473127365112305, 29.623613357543945]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 8.0, 9.0, 7.0, 8.0, 17.0, 20.0, 14.0, 18.0, 21.0, 27.0, 31.0, 25.0, 29.0, 26.0, 36.0, 50.0, 41.0, 38.0, 40.0, 51.0, 39.0, 43.0, 35.0, 38.0, 37.0, 31.0, 38.0, 30.0, 31.0, 22.0, 20.0, 18.0, 19.0, 18.0, 15.0, 12.0, 5.0, 7.0, 4.0, 9.0, 8.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-48.33363342285156, -46.94134521484375, -45.54905700683594, -44.156768798828125, -42.76448059082031, -41.372188568115234, -39.97990036010742, -38.58761215209961, -37.1953239440918, -35.803035736083984, -34.41074752807617, -33.01845932006836, -31.626169204711914, -30.2338809967041, -28.841590881347656, -27.449302673339844, -26.05701446533203, -24.66472625732422, -23.272438049316406, -21.88014793395996, -20.48785972595215, -19.095571517944336, -17.70328140258789, -16.310993194580078, -14.918704986572266, -13.526416778564453, -12.134127616882324, -10.741838455200195, -9.349550247192383, -7.957261562347412, -6.564972877502441, -5.1726837158203125, -3.7803993225097656, -2.388110637664795, -0.9958219528198242, 0.3964667320251465, 1.7887554168701172, 3.181044101715088, 4.573332786560059, 5.9656219482421875, 7.35791015625, 8.750198364257812, 10.142487525939941, 11.53477668762207, 12.927064895629883, 14.319353103637695, 15.711642265319824, 17.103931427001953, 18.496219635009766, 19.888507843017578, 21.28079605102539, 22.673086166381836, 24.06537437438965, 25.45766258239746, 26.849952697753906, 28.24224090576172, 29.63452911376953, 31.026817321777344, 32.419105529785156, 33.81139373779297, 35.20368194580078, 36.59597396850586, 37.98826217651367, 39.380550384521484, 40.7728385925293]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 6.0, 2.0, 6.0, 8.0, 10.0, 8.0, 8.0, 11.0, 11.0, 15.0, 28.0, 20.0, 19.0, 41.0, 34.0, 41.0, 39.0, 43.0, 30.0, 35.0, 44.0, 51.0, 38.0, 46.0, 38.0, 30.0, 41.0, 45.0, 38.0, 24.0, 22.0, 41.0, 20.0, 13.0, 12.0, 24.0, 11.0, 9.0, 12.0, 4.0, 8.0, 6.0, 2.0, 5.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.328125, -6.10919189453125, -5.8902587890625, -5.67132568359375, -5.452392578125, -5.23345947265625, -5.0145263671875, -4.79559326171875, -4.57666015625, -4.35772705078125, -4.1387939453125, -3.91986083984375, -3.700927734375, -3.48199462890625, -3.2630615234375, -3.04412841796875, -2.8251953125, -2.60626220703125, -2.3873291015625, -2.16839599609375, -1.949462890625, -1.73052978515625, -1.5115966796875, -1.29266357421875, -1.07373046875, -0.85479736328125, -0.6358642578125, -0.41693115234375, -0.197998046875, 0.02093505859375, 0.2398681640625, 0.45880126953125, 0.677734375, 0.89666748046875, 1.1156005859375, 1.33453369140625, 1.553466796875, 1.77239990234375, 1.9913330078125, 2.21026611328125, 2.42919921875, 2.64813232421875, 2.8670654296875, 3.08599853515625, 3.304931640625, 3.52386474609375, 3.7427978515625, 3.96173095703125, 4.1806640625, 4.39959716796875, 4.6185302734375, 4.83746337890625, 5.056396484375, 5.27532958984375, 5.4942626953125, 5.71319580078125, 5.93212890625, 6.15106201171875, 6.3699951171875, 6.58892822265625, 6.807861328125, 7.02679443359375, 7.2457275390625, 7.46466064453125, 7.68359375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 10.0, 11.0, 13.0, 25.0, 30.0, 26.0, 48.0, 63.0, 99.0, 146.0, 154.0, 229.0, 324.0, 469.0, 649.0, 930.0, 1380.0, 2121.0, 3279.0, 5763.0, 11206.0, 27858.0, 90910.0, 355331.0, 1090292.0, 1579440.0, 727730.0, 202653.0, 53788.0, 18111.0, 8243.0, 4508.0, 2700.0, 1773.0, 1122.0, 794.0, 590.0, 408.0, 293.0, 197.0, 140.0, 116.0, 96.0, 56.0, 36.0, 37.0, 21.0, 23.0, 16.0, 6.0, 9.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-7.55078125, -7.31695556640625, -7.0831298828125, -6.84930419921875, -6.615478515625, -6.38165283203125, -6.1478271484375, -5.91400146484375, -5.68017578125, -5.44635009765625, -5.2125244140625, -4.97869873046875, -4.744873046875, -4.51104736328125, -4.2772216796875, -4.04339599609375, -3.8095703125, -3.57574462890625, -3.3419189453125, -3.10809326171875, -2.874267578125, -2.64044189453125, -2.4066162109375, -2.17279052734375, -1.93896484375, -1.70513916015625, -1.4713134765625, -1.23748779296875, -1.003662109375, -0.76983642578125, -0.5360107421875, -0.30218505859375, -0.068359375, 0.16546630859375, 0.3992919921875, 0.63311767578125, 0.866943359375, 1.10076904296875, 1.3345947265625, 1.56842041015625, 1.80224609375, 2.03607177734375, 2.2698974609375, 2.50372314453125, 2.737548828125, 2.97137451171875, 3.2052001953125, 3.43902587890625, 3.6728515625, 3.90667724609375, 4.1405029296875, 4.37432861328125, 4.608154296875, 4.84197998046875, 5.0758056640625, 5.30963134765625, 5.54345703125, 5.77728271484375, 6.0111083984375, 6.24493408203125, 6.478759765625, 6.71258544921875, 6.9464111328125, 7.18023681640625, 7.4140625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 22.0, 35.0, 92.0, 241.0, 564.0, 1237.0, 1055.0, 475.0, 229.0, 78.0, 34.0, 9.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.15625, -35.119384765625, -34.08251953125, -33.045654296875, -32.0087890625, -30.971923828125, -29.93505859375, -28.898193359375, -27.861328125, -26.824462890625, -25.78759765625, -24.750732421875, -23.7138671875, -22.677001953125, -21.64013671875, -20.603271484375, -19.56640625, -18.529541015625, -17.49267578125, -16.455810546875, -15.4189453125, -14.382080078125, -13.34521484375, -12.308349609375, -11.271484375, -10.234619140625, -9.19775390625, -8.160888671875, -7.1240234375, -6.087158203125, -5.05029296875, -4.013427734375, -2.9765625, -1.939697265625, -0.90283203125, 0.134033203125, 1.1708984375, 2.207763671875, 3.24462890625, 4.281494140625, 5.318359375, 6.355224609375, 7.39208984375, 8.428955078125, 9.4658203125, 10.502685546875, 11.53955078125, 12.576416015625, 13.61328125, 14.650146484375, 15.68701171875, 16.723876953125, 17.7607421875, 18.797607421875, 19.83447265625, 20.871337890625, 21.908203125, 22.945068359375, 23.98193359375, 25.018798828125, 26.0556640625, 27.092529296875, 28.12939453125, 29.166259765625, 30.203125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 9.0, 18.0, 36.0, 78.0, 195.0, 542.0, 1455.0, 9927.0, 4149993.0, 29147.0, 1860.0, 616.0, 233.0, 86.0, 47.0, 12.0, 10.0, 5.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.71875, -51.84033203125, -49.9619140625, -48.08349609375, -46.205078125, -44.32666015625, -42.4482421875, -40.56982421875, -38.69140625, -36.81298828125, -34.9345703125, -33.05615234375, -31.177734375, -29.29931640625, -27.4208984375, -25.54248046875, -23.6640625, -21.78564453125, -19.9072265625, -18.02880859375, -16.150390625, -14.27197265625, -12.3935546875, -10.51513671875, -8.63671875, -6.75830078125, -4.8798828125, -3.00146484375, -1.123046875, 0.75537109375, 2.6337890625, 4.51220703125, 6.390625, 8.26904296875, 10.1474609375, 12.02587890625, 13.904296875, 15.78271484375, 17.6611328125, 19.53955078125, 21.41796875, 23.29638671875, 25.1748046875, 27.05322265625, 28.931640625, 30.81005859375, 32.6884765625, 34.56689453125, 36.4453125, 38.32373046875, 40.2021484375, 42.08056640625, 43.958984375, 45.83740234375, 47.7158203125, 49.59423828125, 51.47265625, 53.35107421875, 55.2294921875, 57.10791015625, 58.986328125, 60.86474609375, 62.7431640625, 64.62158203125, 66.5]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 14.0, 282.0, 660.0, 59.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-459.8144836425781, -451.0070495605469, -442.1996154785156, -433.3921813964844, -424.5847473144531, -415.7773132324219, -406.9698791503906, -398.16241455078125, -389.35498046875, -380.54754638671875, -371.7401123046875, -362.93267822265625, -354.125244140625, -345.31781005859375, -336.5103759765625, -327.70294189453125, -318.8955078125, -310.08807373046875, -301.2806396484375, -292.47320556640625, -283.665771484375, -274.85833740234375, -266.0509033203125, -257.24346923828125, -248.43601989746094, -239.6285858154297, -230.82115173339844, -222.0137176513672, -213.20626831054688, -204.39883422851562, -195.59140014648438, -186.78396606445312, -177.9765625, -169.16912841796875, -160.3616943359375, -151.55426025390625, -142.746826171875, -133.93939208984375, -125.13194274902344, -116.32450866699219, -107.51707458496094, -98.70964050292969, -89.90220642089844, -81.09476470947266, -72.2873306274414, -63.479896545410156, -54.67245864868164, -45.865020751953125, -37.057586669921875, -28.250150680541992, -19.44271469116211, -10.635278701782227, -1.8278427124023438, 6.979591369628906, 15.787029266357422, 24.594467163085938, 33.40190124511719, 42.20933532714844, 51.01677322387695, 59.82421112060547, 68.63164520263672, 77.43907928466797, 86.24652099609375, 95.053955078125, 103.86138916015625]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 6.0, 10.0, 14.0, 9.0, 8.0, 14.0, 9.0, 22.0, 25.0, 23.0, 22.0, 29.0, 26.0, 35.0, 31.0, 35.0, 37.0, 32.0, 45.0, 41.0, 32.0, 55.0, 45.0, 36.0, 42.0, 31.0, 33.0, 31.0, 34.0, 25.0, 23.0, 19.0, 19.0, 22.0, 14.0, 11.0, 14.0, 13.0, 7.0, 3.0, 5.0, 0.0, 4.0, 6.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-47.485198974609375, -46.136837005615234, -44.78847885131836, -43.44011688232422, -42.09175491333008, -40.74339294433594, -39.39503479003906, -38.04667282104492, -36.69831085205078, -35.34994888305664, -34.001590728759766, -32.653228759765625, -31.304866790771484, -29.956506729125977, -28.60814666748047, -27.259784698486328, -25.911426544189453, -24.563066482543945, -23.214704513549805, -21.866344451904297, -20.517982482910156, -19.16962242126465, -17.82126235961914, -16.472900390625, -15.124540328979492, -13.776179313659668, -12.427818298339844, -11.079458236694336, -9.731097221374512, -8.382736206054688, -7.03437614440918, -5.6860151290893555, -4.337654113769531, -2.989293336868286, -1.640932559967041, -0.292572021484375, 1.0557889938354492, 2.4041500091552734, 3.7525100708007812, 5.1008710861206055, 6.44923210144043, 7.797593116760254, 9.145954132080078, 10.494314193725586, 11.84267520904541, 13.191036224365234, 14.539396286010742, 15.887757301330566, 17.23611831665039, 18.5844783782959, 19.93284034729004, 21.281200408935547, 22.629562377929688, 23.977922439575195, 25.326282501220703, 26.674644470214844, 28.02300453186035, 29.37136459350586, 30.7197265625, 32.068084716796875, 33.416446685791016, 34.764808654785156, 36.11316680908203, 37.46152877807617, 38.80989074707031]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 3.0, 6.0, 9.0, 8.0, 9.0, 6.0, 14.0, 12.0, 11.0, 17.0, 16.0, 18.0, 15.0, 25.0, 24.0, 39.0, 40.0, 30.0, 45.0, 38.0, 47.0, 47.0, 42.0, 31.0, 41.0, 36.0, 30.0, 42.0, 24.0, 21.0, 28.0, 23.0, 37.0, 24.0, 21.0, 19.0, 18.0, 10.0, 20.0, 3.0, 10.0, 12.0, 7.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.77734375, -4.626220703125, -4.47509765625, -4.323974609375, -4.1728515625, -4.021728515625, -3.87060546875, -3.719482421875, -3.568359375, -3.417236328125, -3.26611328125, -3.114990234375, -2.9638671875, -2.812744140625, -2.66162109375, -2.510498046875, -2.359375, -2.208251953125, -2.05712890625, -1.906005859375, -1.7548828125, -1.603759765625, -1.45263671875, -1.301513671875, -1.150390625, -0.999267578125, -0.84814453125, -0.697021484375, -0.5458984375, -0.394775390625, -0.24365234375, -0.092529296875, 0.05859375, 0.209716796875, 0.36083984375, 0.511962890625, 0.6630859375, 0.814208984375, 0.96533203125, 1.116455078125, 1.267578125, 1.418701171875, 1.56982421875, 1.720947265625, 1.8720703125, 2.023193359375, 2.17431640625, 2.325439453125, 2.4765625, 2.627685546875, 2.77880859375, 2.929931640625, 3.0810546875, 3.232177734375, 3.38330078125, 3.534423828125, 3.685546875, 3.836669921875, 3.98779296875, 4.138916015625, 4.2900390625, 4.441162109375, 4.59228515625, 4.743408203125, 4.89453125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 4.0, 6.0, 9.0, 9.0, 24.0, 17.0, 36.0, 54.0, 70.0, 105.0, 152.0, 210.0, 329.0, 512.0, 659.0, 1012.0, 1540.0, 2299.0, 3469.0, 5286.0, 8136.0, 12370.0, 19916.0, 32196.0, 53491.0, 92781.0, 156601.0, 214928.0, 174580.0, 106772.0, 61920.0, 36030.0, 22227.0, 14162.0, 9026.0, 6037.0, 3844.0, 2539.0, 1760.0, 1095.0, 742.0, 511.0, 359.0, 249.0, 146.0, 99.0, 71.0, 68.0, 33.0, 28.0, 15.0, 11.0, 8.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 2.0], "bins": [-0.53662109375, -0.5196533203125, -0.502685546875, -0.4857177734375, -0.46875, -0.4517822265625, -0.434814453125, -0.4178466796875, -0.40087890625, -0.3839111328125, -0.366943359375, -0.3499755859375, -0.3330078125, -0.3160400390625, -0.299072265625, -0.2821044921875, -0.26513671875, -0.2481689453125, -0.231201171875, -0.2142333984375, -0.197265625, -0.1802978515625, -0.163330078125, -0.1463623046875, -0.12939453125, -0.1124267578125, -0.095458984375, -0.0784912109375, -0.0615234375, -0.0445556640625, -0.027587890625, -0.0106201171875, 0.00634765625, 0.0233154296875, 0.040283203125, 0.0572509765625, 0.07421875, 0.0911865234375, 0.108154296875, 0.1251220703125, 0.14208984375, 0.1590576171875, 0.176025390625, 0.1929931640625, 0.2099609375, 0.2269287109375, 0.243896484375, 0.2608642578125, 0.27783203125, 0.2947998046875, 0.311767578125, 0.3287353515625, 0.345703125, 0.3626708984375, 0.379638671875, 0.3966064453125, 0.41357421875, 0.4305419921875, 0.447509765625, 0.4644775390625, 0.4814453125, 0.4984130859375, 0.515380859375, 0.5323486328125, 0.54931640625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 5.0, 8.0, 9.0, 9.0, 11.0, 12.0, 16.0, 12.0, 20.0, 14.0, 23.0, 27.0, 23.0, 31.0, 32.0, 37.0, 41.0, 33.0, 41.0, 40.0, 49.0, 1059.0, 33.0, 33.0, 29.0, 46.0, 41.0, 33.0, 34.0, 28.0, 23.0, 16.0, 20.0, 23.0, 18.0, 10.0, 15.0, 14.0, 10.0, 10.0, 2.0, 11.0, 6.0, 3.0, 5.0, 2.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.013671875, -2.9168701171875, -2.820068359375, -2.7232666015625, -2.62646484375, -2.5296630859375, -2.432861328125, -2.3360595703125, -2.2392578125, -2.1424560546875, -2.045654296875, -1.9488525390625, -1.85205078125, -1.7552490234375, -1.658447265625, -1.5616455078125, -1.46484375, -1.3680419921875, -1.271240234375, -1.1744384765625, -1.07763671875, -0.9808349609375, -0.884033203125, -0.7872314453125, -0.6904296875, -0.5936279296875, -0.496826171875, -0.4000244140625, -0.30322265625, -0.2064208984375, -0.109619140625, -0.0128173828125, 0.083984375, 0.1807861328125, 0.277587890625, 0.3743896484375, 0.47119140625, 0.5679931640625, 0.664794921875, 0.7615966796875, 0.8583984375, 0.9552001953125, 1.052001953125, 1.1488037109375, 1.24560546875, 1.3424072265625, 1.439208984375, 1.5360107421875, 1.6328125, 1.7296142578125, 1.826416015625, 1.9232177734375, 2.02001953125, 2.1168212890625, 2.213623046875, 2.3104248046875, 2.4072265625, 2.5040283203125, 2.600830078125, 2.6976318359375, 2.79443359375, 2.8912353515625, 2.988037109375, 3.0848388671875, 3.181640625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 8.0, 10.0, 15.0, 25.0, 33.0, 46.0, 75.0, 136.0, 199.0, 304.0, 484.0, 799.0, 1319.0, 2302.0, 3665.0, 6156.0, 10793.0, 18877.0, 33967.0, 63654.0, 123268.0, 216947.0, 1289776.0, 150649.0, 78890.0, 41251.0, 22204.0, 12702.0, 7502.0, 4308.0, 2575.0, 1631.0, 987.0, 607.0, 357.0, 210.0, 141.0, 89.0, 53.0, 46.0, 35.0, 12.0, 10.0, 7.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.64892578125, -0.6299285888671875, -0.610931396484375, -0.5919342041015625, -0.57293701171875, -0.5539398193359375, -0.534942626953125, -0.5159454345703125, -0.4969482421875, -0.4779510498046875, -0.458953857421875, -0.4399566650390625, -0.42095947265625, -0.4019622802734375, -0.382965087890625, -0.3639678955078125, -0.344970703125, -0.3259735107421875, -0.306976318359375, -0.2879791259765625, -0.26898193359375, -0.2499847412109375, -0.230987548828125, -0.2119903564453125, -0.1929931640625, -0.1739959716796875, -0.154998779296875, -0.1360015869140625, -0.11700439453125, -0.0980072021484375, -0.079010009765625, -0.0600128173828125, -0.041015625, -0.0220184326171875, -0.003021240234375, 0.0159759521484375, 0.03497314453125, 0.0539703369140625, 0.072967529296875, 0.0919647216796875, 0.1109619140625, 0.1299591064453125, 0.148956298828125, 0.1679534912109375, 0.18695068359375, 0.2059478759765625, 0.224945068359375, 0.2439422607421875, 0.262939453125, 0.2819366455078125, 0.300933837890625, 0.3199310302734375, 0.33892822265625, 0.3579254150390625, 0.376922607421875, 0.3959197998046875, 0.4149169921875, 0.4339141845703125, 0.452911376953125, 0.4719085693359375, 0.49090576171875, 0.5099029541015625, 0.528900146484375, 0.5478973388671875, 0.56689453125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 6.0, 4.0, 9.0, 7.0, 6.0, 9.0, 9.0, 20.0, 12.0, 11.0, 17.0, 21.0, 23.0, 18.0, 32.0, 32.0, 35.0, 35.0, 47.0, 26.0, 43.0, 34.0, 42.0, 38.0, 36.0, 39.0, 42.0, 32.0, 33.0, 28.0, 32.0, 30.0, 30.0, 24.0, 17.0, 22.0, 16.0, 18.0, 14.0, 6.0, 9.0, 11.0, 6.0, 4.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0009398460388183594, -0.0009068027138710022, -0.000873759388923645, -0.0008407160639762878, -0.0008076727390289307, -0.0007746294140815735, -0.0007415860891342163, -0.0007085427641868591, -0.000675499439239502, -0.0006424561142921448, -0.0006094127893447876, -0.0005763694643974304, -0.0005433261394500732, -0.0005102828145027161, -0.0004772394895553589, -0.0004441961646080017, -0.00041115283966064453, -0.00037810951471328735, -0.0003450661897659302, -0.000312022864818573, -0.0002789795398712158, -0.00024593621492385864, -0.00021289288997650146, -0.0001798495650291443, -0.0001468062400817871, -0.00011376291513442993, -8.071959018707275e-05, -4.7676265239715576e-05, -1.4632940292358398e-05, 1.841038465499878e-05, 5.145370960235596e-05, 8.449703454971313e-05, 0.00011754035949707031, 0.0001505836844444275, 0.00018362700939178467, 0.00021667033433914185, 0.000249713659286499, 0.0002827569842338562, 0.0003158003091812134, 0.00034884363412857056, 0.00038188695907592773, 0.0004149302840232849, 0.0004479736089706421, 0.00048101693391799927, 0.0005140602588653564, 0.0005471035838127136, 0.0005801469087600708, 0.000613190233707428, 0.0006462335586547852, 0.0006792768836021423, 0.0007123202085494995, 0.0007453635334968567, 0.0007784068584442139, 0.000811450183391571, 0.0008444935083389282, 0.0008775368332862854, 0.0009105801582336426, 0.0009436234831809998, 0.000976666808128357, 0.0010097101330757141, 0.0010427534580230713, 0.0010757967829704285, 0.0011088401079177856, 0.0011418834328651428, 0.0011749267578125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 7.0, 6.0, 6.0, 18.0, 19.0, 27.0, 36.0, 40.0, 41.0, 59.0, 87.0, 90.0, 132.0, 205.0, 279.0, 398.0, 558.0, 1008.0, 11091.0, 1027635.0, 4185.0, 863.0, 522.0, 336.0, 227.0, 181.0, 111.0, 92.0, 64.0, 51.0, 42.0, 29.0, 26.0, 23.0, 13.0, 16.0, 9.0, 6.0, 7.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0263519287109375, -0.025563478469848633, -0.024775028228759766, -0.0239865779876709, -0.02319812774658203, -0.022409677505493164, -0.021621227264404297, -0.02083277702331543, -0.020044326782226562, -0.019255876541137695, -0.018467426300048828, -0.01767897605895996, -0.016890525817871094, -0.016102075576782227, -0.01531362533569336, -0.014525175094604492, -0.013736724853515625, -0.012948274612426758, -0.01215982437133789, -0.011371374130249023, -0.010582923889160156, -0.009794473648071289, -0.009006023406982422, -0.008217573165893555, -0.0074291229248046875, -0.00664067268371582, -0.005852222442626953, -0.005063772201538086, -0.004275321960449219, -0.0034868717193603516, -0.0026984214782714844, -0.0019099712371826172, -0.00112152099609375, -0.0003330707550048828, 0.0004553794860839844, 0.0012438297271728516, 0.0020322799682617188, 0.002820730209350586, 0.003609180450439453, 0.00439763069152832, 0.0051860809326171875, 0.005974531173706055, 0.006762981414794922, 0.007551431655883789, 0.008339881896972656, 0.009128332138061523, 0.00991678237915039, 0.010705232620239258, 0.011493682861328125, 0.012282133102416992, 0.01307058334350586, 0.013859033584594727, 0.014647483825683594, 0.015435934066772461, 0.016224384307861328, 0.017012834548950195, 0.017801284790039062, 0.01858973503112793, 0.019378185272216797, 0.020166635513305664, 0.02095508575439453, 0.0217435359954834, 0.022531986236572266, 0.023320436477661133, 0.02410888671875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [16.0, 366.0, 557.0, 77.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003155087761115283, -0.00016887449601199478, -2.224021591246128e-05, 0.000124394049635157, 0.0002710283442866057, 0.00041766263893805444, 0.0005642968462780118, 0.0007109311409294605, 0.0008575654355809093, 0.001004199730232358, 0.0011508340248838067, 0.0012974683195352554, 0.0014441024977713823, 0.0015907369088381529, 0.0017373710870742798, 0.0018840053817257285, 0.0020306396763771772, 0.002177273854613304, 0.0023239082656800747, 0.0024705424439162016, 0.002617176854982972, 0.002763811033219099, 0.0029104454442858696, 0.0030570796225219965, 0.003203714033588767, 0.003350348211824894, 0.0034969826228916645, 0.0036436168011277914, 0.003790251212194562, 0.003936885390430689, 0.004083519801497459, 0.004230153746902943, 0.004376788157969713, 0.004523422569036484, 0.004670056514441967, 0.0048166909255087376, 0.004963325336575508, 0.005109959747642279, 0.005256593693047762, 0.0054032281041145325, 0.005549862515181303, 0.005696496926248074, 0.005843130871653557, 0.005989765282720327, 0.006136399693787098, 0.0062830341048538685, 0.006429668050259352, 0.006576302461326122, 0.0067229364067316055, 0.006869570817798376, 0.007016204763203859, 0.00716283917427063, 0.0073094735853374004, 0.007456107996404171, 0.007602741941809654, 0.007749376352876425, 0.007896010763943195, 0.008042644709348679, 0.008189279586076736, 0.00833591353148222, 0.008482547476887703, 0.00862918235361576, 0.008775816299021244, 0.008922450244426727, 0.009069085121154785]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 4.0, 11.0, 13.0, 10.0, 13.0, 14.0, 12.0, 20.0, 24.0, 15.0, 27.0, 22.0, 31.0, 27.0, 26.0, 32.0, 32.0, 36.0, 37.0, 35.0, 39.0, 34.0, 30.0, 37.0, 38.0, 42.0, 44.0, 31.0, 23.0, 29.0, 23.0, 20.0, 24.0, 17.0, 17.0, 10.0, 19.0, 15.0, 18.0, 5.0, 4.0, 9.0, 9.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0005914568901062012, -0.000571046955883503, -0.0005506370216608047, -0.0005302270874381065, -0.0005098171532154083, -0.0004894072189927101, -0.0004689972847700119, -0.0004485873505473137, -0.0004281774163246155, -0.00040776748210191727, -0.00038735754787921906, -0.00036694761365652084, -0.00034653767943382263, -0.0003261277452111244, -0.0003057178109884262, -0.000285307876765728, -0.0002648979425430298, -0.0002444880083203316, -0.00022407807409763336, -0.00020366813987493515, -0.00018325820565223694, -0.00016284827142953873, -0.00014243833720684052, -0.0001220284029841423, -0.00010161846876144409, -8.120853453874588e-05, -6.079860031604767e-05, -4.038866609334946e-05, -1.9978731870651245e-05, 4.3120235204696655e-07, 2.0841136574745178e-05, 4.125107079744339e-05, 6.16610050201416e-05, 8.207093924283981e-05, 0.00010248087346553802, 0.00012289080768823624, 0.00014330074191093445, 0.00016371067613363266, 0.00018412061035633087, 0.00020453054457902908, 0.0002249404788017273, 0.0002453504130244255, 0.0002657603472471237, 0.00028617028146982193, 0.00030658021569252014, 0.00032699014991521835, 0.00034740008413791656, 0.0003678100183606148, 0.000388219952583313, 0.0004086298868060112, 0.0004290398210287094, 0.0004494497552514076, 0.00046985968947410583, 0.000490269623696804, 0.0005106795579195023, 0.0005310894921422005, 0.0005514994263648987, 0.0005719093605875969, 0.0005923192948102951, 0.0006127292290329933, 0.0006331391632556915, 0.0006535490974783897, 0.000673959031701088, 0.0006943689659237862, 0.0007147789001464844]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 3.0, 6.0, 9.0, 8.0, 9.0, 6.0, 14.0, 12.0, 11.0, 17.0, 16.0, 18.0, 15.0, 25.0, 24.0, 39.0, 40.0, 30.0, 45.0, 38.0, 47.0, 47.0, 42.0, 31.0, 41.0, 36.0, 30.0, 42.0, 24.0, 21.0, 28.0, 23.0, 37.0, 24.0, 21.0, 19.0, 18.0, 10.0, 20.0, 3.0, 10.0, 12.0, 7.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-4.77734375, -4.626220703125, -4.47509765625, -4.323974609375, -4.1728515625, -4.021728515625, -3.87060546875, -3.719482421875, -3.568359375, -3.417236328125, -3.26611328125, -3.114990234375, -2.9638671875, -2.812744140625, -2.66162109375, -2.510498046875, -2.359375, -2.208251953125, -2.05712890625, -1.906005859375, -1.7548828125, -1.603759765625, -1.45263671875, -1.301513671875, -1.150390625, -0.999267578125, -0.84814453125, -0.697021484375, -0.5458984375, -0.394775390625, -0.24365234375, -0.092529296875, 0.05859375, 0.209716796875, 0.36083984375, 0.511962890625, 0.6630859375, 0.814208984375, 0.96533203125, 1.116455078125, 1.267578125, 1.418701171875, 1.56982421875, 1.720947265625, 1.8720703125, 2.023193359375, 2.17431640625, 2.325439453125, 2.4765625, 2.627685546875, 2.77880859375, 2.929931640625, 3.0810546875, 3.232177734375, 3.38330078125, 3.534423828125, 3.685546875, 3.836669921875, 3.98779296875, 4.138916015625, 4.2900390625, 4.441162109375, 4.59228515625, 4.743408203125, 4.89453125]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 5.0, 12.0, 9.0, 11.0, 19.0, 26.0, 18.0, 31.0, 38.0, 46.0, 62.0, 90.0, 94.0, 154.0, 202.0, 269.0, 408.0, 581.0, 934.0, 1612.0, 3015.0, 6632.0, 18478.0, 64699.0, 311306.0, 491655.0, 102723.0, 27049.0, 9251.0, 3788.0, 1874.0, 1034.0, 731.0, 442.0, 321.0, 237.0, 175.0, 117.0, 94.0, 84.0, 49.0, 47.0, 42.0, 22.0, 17.0, 7.0, 13.0, 10.0, 8.0, 6.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-7.8515625, -7.599609375, -7.34765625, -7.095703125, -6.84375, -6.591796875, -6.33984375, -6.087890625, -5.8359375, -5.583984375, -5.33203125, -5.080078125, -4.828125, -4.576171875, -4.32421875, -4.072265625, -3.8203125, -3.568359375, -3.31640625, -3.064453125, -2.8125, -2.560546875, -2.30859375, -2.056640625, -1.8046875, -1.552734375, -1.30078125, -1.048828125, -0.796875, -0.544921875, -0.29296875, -0.041015625, 0.2109375, 0.462890625, 0.71484375, 0.966796875, 1.21875, 1.470703125, 1.72265625, 1.974609375, 2.2265625, 2.478515625, 2.73046875, 2.982421875, 3.234375, 3.486328125, 3.73828125, 3.990234375, 4.2421875, 4.494140625, 4.74609375, 4.998046875, 5.25, 5.501953125, 5.75390625, 6.005859375, 6.2578125, 6.509765625, 6.76171875, 7.013671875, 7.265625, 7.517578125, 7.76953125, 8.021484375, 8.2734375]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 5.0, 2.0, 8.0, 10.0, 13.0, 10.0, 15.0, 21.0, 23.0, 28.0, 37.0, 40.0, 53.0, 59.0, 73.0, 136.0, 1726.0, 356.0, 88.0, 50.0, 65.0, 49.0, 32.0, 25.0, 30.0, 18.0, 20.0, 16.0, 14.0, 9.0, 4.0, 5.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.6875, -16.162353515625, -15.63720703125, -15.112060546875, -14.5869140625, -14.061767578125, -13.53662109375, -13.011474609375, -12.486328125, -11.961181640625, -11.43603515625, -10.910888671875, -10.3857421875, -9.860595703125, -9.33544921875, -8.810302734375, -8.28515625, -7.760009765625, -7.23486328125, -6.709716796875, -6.1845703125, -5.659423828125, -5.13427734375, -4.609130859375, -4.083984375, -3.558837890625, -3.03369140625, -2.508544921875, -1.9833984375, -1.458251953125, -0.93310546875, -0.407958984375, 0.1171875, 0.642333984375, 1.16748046875, 1.692626953125, 2.2177734375, 2.742919921875, 3.26806640625, 3.793212890625, 4.318359375, 4.843505859375, 5.36865234375, 5.893798828125, 6.4189453125, 6.944091796875, 7.46923828125, 7.994384765625, 8.51953125, 9.044677734375, 9.56982421875, 10.094970703125, 10.6201171875, 11.145263671875, 11.67041015625, 12.195556640625, 12.720703125, 13.245849609375, 13.77099609375, 14.296142578125, 14.8212890625, 15.346435546875, 15.87158203125, 16.396728515625, 16.921875]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 7.0, 4.0, 14.0, 9.0, 21.0, 23.0, 35.0, 51.0, 74.0, 147.0, 306.0, 569.0, 2058.0, 3120946.0, 19560.0, 921.0, 383.0, 221.0, 112.0, 69.0, 37.0, 34.0, 26.0, 15.0, 13.0, 13.0, 9.0, 5.0, 3.0, 2.0, 5.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0], "bins": [-47.53125, -46.033203125, -44.53515625, -43.037109375, -41.5390625, -40.041015625, -38.54296875, -37.044921875, -35.546875, -34.048828125, -32.55078125, -31.052734375, -29.5546875, -28.056640625, -26.55859375, -25.060546875, -23.5625, -22.064453125, -20.56640625, -19.068359375, -17.5703125, -16.072265625, -14.57421875, -13.076171875, -11.578125, -10.080078125, -8.58203125, -7.083984375, -5.5859375, -4.087890625, -2.58984375, -1.091796875, 0.40625, 1.904296875, 3.40234375, 4.900390625, 6.3984375, 7.896484375, 9.39453125, 10.892578125, 12.390625, 13.888671875, 15.38671875, 16.884765625, 18.3828125, 19.880859375, 21.37890625, 22.876953125, 24.375, 25.873046875, 27.37109375, 28.869140625, 30.3671875, 31.865234375, 33.36328125, 34.861328125, 36.359375, 37.857421875, 39.35546875, 40.853515625, 42.3515625, 43.849609375, 45.34765625, 46.845703125, 48.34375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 28.0, 351.0, 552.0, 78.0, 3.0], "bins": [-153.66494750976562, -151.15228271484375, -148.63961791992188, -146.126953125, -143.61428833007812, -141.10162353515625, -138.58895874023438, -136.0762939453125, -133.56362915039062, -131.05096435546875, -128.53829956054688, -126.025634765625, -123.51296997070312, -121.00030517578125, -118.48764038085938, -115.97496795654297, -113.46229553222656, -110.94963073730469, -108.43696594238281, -105.92430114746094, -103.41163635253906, -100.89897155761719, -98.38630676269531, -95.8736343383789, -93.36097717285156, -90.84831237792969, -88.33564758300781, -85.82298278808594, -83.31031799316406, -80.79765319824219, -78.28498840332031, -75.7723159790039, -73.25965118408203, -70.74698638916016, -68.23432159423828, -65.7216567993164, -63.208988189697266, -60.69632339477539, -58.183658599853516, -55.670989990234375, -53.1583251953125, -50.645660400390625, -48.13299560546875, -45.620330810546875, -43.107662200927734, -40.59499740600586, -38.082332611083984, -35.569664001464844, -33.05699920654297, -30.544334411621094, -28.031667709350586, -25.51900291442871, -23.006336212158203, -20.493671417236328, -17.981006622314453, -15.468339920043945, -12.955677032470703, -10.443011283874512, -7.9303460121154785, -5.417680740356445, -2.905014991760254, -0.3923492431640625, 2.1203155517578125, 4.63298225402832, 7.145647048950195]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 8.0, 3.0, 5.0, 4.0, 6.0, 4.0, 4.0, 12.0, 7.0, 10.0, 14.0, 15.0, 19.0, 18.0, 14.0, 18.0, 22.0, 24.0, 29.0, 31.0, 30.0, 23.0, 46.0, 41.0, 36.0, 28.0, 29.0, 35.0, 41.0, 43.0, 40.0, 27.0, 44.0, 21.0, 30.0, 34.0, 21.0, 21.0, 14.0, 14.0, 16.0, 21.0, 9.0, 13.0, 10.0, 8.0, 11.0, 6.0, 4.0, 6.0, 7.0, 6.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-23.029895782470703, -22.220365524291992, -21.41083526611328, -20.60130500793457, -19.79177474975586, -18.98224639892578, -18.172714233398438, -17.36318588256836, -16.55365562438965, -15.744125366210938, -14.934595108032227, -14.125064849853516, -13.315535545349121, -12.50600528717041, -11.6964750289917, -10.886945724487305, -10.077414512634277, -9.267884254455566, -8.458353996276855, -7.648824214935303, -6.83929443359375, -6.029764175415039, -5.220233917236328, -4.410704135894775, -3.6011738777160645, -2.7916438579559326, -1.9821137189865112, -1.1725835800170898, -0.363053560256958, 0.44647645950317383, 1.2560067176818848, 2.0655364990234375, 2.8750667572021484, 3.6845967769622803, 4.494126796722412, 5.303657054901123, 6.113186836242676, 6.922717094421387, 7.732247352600098, 8.541776657104492, 9.351306915283203, 10.160837173461914, 10.970367431640625, 11.779897689819336, 12.58942699432373, 13.398957252502441, 14.208487510681152, 15.018016815185547, 15.827548027038574, 16.63707733154297, 17.44660758972168, 18.25613784790039, 19.0656681060791, 19.875198364257812, 20.684728622436523, 21.494258880615234, 22.303789138793945, 23.113319396972656, 23.922849655151367, 24.732379913330078, 25.54191017150879, 26.3514404296875, 27.160968780517578, 27.97049903869629, 28.780029296875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 8.0, 8.0, 7.0, 11.0, 13.0, 13.0, 18.0, 11.0, 23.0, 19.0, 22.0, 19.0, 33.0, 25.0, 34.0, 33.0, 42.0, 44.0, 39.0, 49.0, 54.0, 42.0, 57.0, 38.0, 45.0, 47.0, 33.0, 24.0, 28.0, 32.0, 16.0, 15.0, 22.0, 17.0, 18.0, 11.0, 12.0, 4.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.84765625, -5.646240234375, -5.44482421875, -5.243408203125, -5.0419921875, -4.840576171875, -4.63916015625, -4.437744140625, -4.236328125, -4.034912109375, -3.83349609375, -3.632080078125, -3.4306640625, -3.229248046875, -3.02783203125, -2.826416015625, -2.625, -2.423583984375, -2.22216796875, -2.020751953125, -1.8193359375, -1.617919921875, -1.41650390625, -1.215087890625, -1.013671875, -0.812255859375, -0.61083984375, -0.409423828125, -0.2080078125, -0.006591796875, 0.19482421875, 0.396240234375, 0.59765625, 0.799072265625, 1.00048828125, 1.201904296875, 1.4033203125, 1.604736328125, 1.80615234375, 2.007568359375, 2.208984375, 2.410400390625, 2.61181640625, 2.813232421875, 3.0146484375, 3.216064453125, 3.41748046875, 3.618896484375, 3.8203125, 4.021728515625, 4.22314453125, 4.424560546875, 4.6259765625, 4.827392578125, 5.02880859375, 5.230224609375, 5.431640625, 5.633056640625, 5.83447265625, 6.035888671875, 6.2373046875, 6.438720703125, 6.64013671875, 6.841552734375, 7.04296875]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 6.0, 9.0, 12.0, 14.0, 16.0, 19.0, 18.0, 31.0, 28.0, 48.0, 48.0, 54.0, 75.0, 105.0, 120.0, 165.0, 202.0, 278.0, 422.0, 576.0, 986.0, 2140.0, 15005.0, 1299366.0, 2833588.0, 34309.0, 3028.0, 1105.0, 670.0, 443.0, 338.0, 258.0, 193.0, 150.0, 93.0, 60.0, 58.0, 46.0, 46.0, 36.0, 32.0, 15.0, 20.0, 13.0, 8.0, 8.0, 6.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-31.859375, -30.86767578125, -29.8759765625, -28.88427734375, -27.892578125, -26.90087890625, -25.9091796875, -24.91748046875, -23.92578125, -22.93408203125, -21.9423828125, -20.95068359375, -19.958984375, -18.96728515625, -17.9755859375, -16.98388671875, -15.9921875, -15.00048828125, -14.0087890625, -13.01708984375, -12.025390625, -11.03369140625, -10.0419921875, -9.05029296875, -8.05859375, -7.06689453125, -6.0751953125, -5.08349609375, -4.091796875, -3.10009765625, -2.1083984375, -1.11669921875, -0.125, 0.86669921875, 1.8583984375, 2.85009765625, 3.841796875, 4.83349609375, 5.8251953125, 6.81689453125, 7.80859375, 8.80029296875, 9.7919921875, 10.78369140625, 11.775390625, 12.76708984375, 13.7587890625, 14.75048828125, 15.7421875, 16.73388671875, 17.7255859375, 18.71728515625, 19.708984375, 20.70068359375, 21.6923828125, 22.68408203125, 23.67578125, 24.66748046875, 25.6591796875, 26.65087890625, 27.642578125, 28.63427734375, 29.6259765625, 30.61767578125, 31.609375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 9.0, 11.0, 12.0, 29.0, 44.0, 99.0, 178.0, 333.0, 651.0, 914.0, 817.0, 432.0, 237.0, 136.0, 71.0, 47.0, 15.0, 14.0, 8.0, 4.0, 6.0, 1.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0625, -13.533935546875, -13.00537109375, -12.476806640625, -11.9482421875, -11.419677734375, -10.89111328125, -10.362548828125, -9.833984375, -9.305419921875, -8.77685546875, -8.248291015625, -7.7197265625, -7.191162109375, -6.66259765625, -6.134033203125, -5.60546875, -5.076904296875, -4.54833984375, -4.019775390625, -3.4912109375, -2.962646484375, -2.43408203125, -1.905517578125, -1.376953125, -0.848388671875, -0.31982421875, 0.208740234375, 0.7373046875, 1.265869140625, 1.79443359375, 2.322998046875, 2.8515625, 3.380126953125, 3.90869140625, 4.437255859375, 4.9658203125, 5.494384765625, 6.02294921875, 6.551513671875, 7.080078125, 7.608642578125, 8.13720703125, 8.665771484375, 9.1943359375, 9.722900390625, 10.25146484375, 10.780029296875, 11.30859375, 11.837158203125, 12.36572265625, 12.894287109375, 13.4228515625, 13.951416015625, 14.47998046875, 15.008544921875, 15.537109375, 16.065673828125, 16.59423828125, 17.122802734375, 17.6513671875, 18.179931640625, 18.70849609375, 19.237060546875, 19.765625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 7.0, 8.0, 8.0, 16.0, 31.0, 53.0, 83.0, 154.0, 270.0, 684.0, 1651.0, 5292.0, 24381.0, 246216.0, 3152776.0, 700747.0, 49661.0, 8243.0, 2246.0, 917.0, 387.0, 165.0, 104.0, 65.0, 35.0, 20.0, 15.0, 9.0, 6.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-15.4375, -15.0047607421875, -14.572021484375, -14.1392822265625, -13.70654296875, -13.2738037109375, -12.841064453125, -12.4083251953125, -11.9755859375, -11.5428466796875, -11.110107421875, -10.6773681640625, -10.24462890625, -9.8118896484375, -9.379150390625, -8.9464111328125, -8.513671875, -8.0809326171875, -7.648193359375, -7.2154541015625, -6.78271484375, -6.3499755859375, -5.917236328125, -5.4844970703125, -5.0517578125, -4.6190185546875, -4.186279296875, -3.7535400390625, -3.32080078125, -2.8880615234375, -2.455322265625, -2.0225830078125, -1.58984375, -1.1571044921875, -0.724365234375, -0.2916259765625, 0.14111328125, 0.5738525390625, 1.006591796875, 1.4393310546875, 1.8720703125, 2.3048095703125, 2.737548828125, 3.1702880859375, 3.60302734375, 4.0357666015625, 4.468505859375, 4.9012451171875, 5.333984375, 5.7667236328125, 6.199462890625, 6.6322021484375, 7.06494140625, 7.4976806640625, 7.930419921875, 8.3631591796875, 8.7958984375, 9.2286376953125, 9.661376953125, 10.0941162109375, 10.52685546875, 10.9595947265625, 11.392333984375, 11.8250732421875, 12.2578125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 21.0, 52.0, 124.0, 226.0, 255.0, 166.0, 92.0, 45.0, 15.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.66563415527344, -116.62301635742188, -111.58039855957031, -106.53778076171875, -101.49516296386719, -96.45254516601562, -91.4099349975586, -86.36731719970703, -81.32469940185547, -76.2820816040039, -71.23946380615234, -66.19684600830078, -61.154232025146484, -56.11161422729492, -51.069000244140625, -46.02638244628906, -40.9837646484375, -35.94114685058594, -30.898530960083008, -25.855915069580078, -20.813297271728516, -15.770679473876953, -10.728063583374023, -5.685447692871094, -0.6428298950195312, 4.399786949157715, 9.442403793334961, 14.485020637512207, 19.527637481689453, 24.570255279541016, 29.612871170043945, 34.655487060546875, 39.6981201171875, 44.74073791503906, 49.783355712890625, 54.82596969604492, 59.868587493896484, 64.91120910644531, 69.95381927490234, 74.9964370727539, 80.03905487060547, 85.08167266845703, 90.1242904663086, 95.16690826416016, 100.20951843261719, 105.25213623046875, 110.29475402832031, 115.33737182617188, 120.37998962402344, 125.422607421875, 130.46522521972656, 135.50784301757812, 140.5504608154297, 145.59307861328125, 150.6356964111328, 155.67831420898438, 160.72091674804688, 165.76353454589844, 170.80615234375, 175.84877014160156, 180.89138793945312, 185.9340057373047, 190.97662353515625, 196.01922607421875, 201.06185913085938]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 8.0, 8.0, 8.0, 19.0, 17.0, 10.0, 18.0, 19.0, 29.0, 31.0, 35.0, 34.0, 19.0, 29.0, 46.0, 44.0, 35.0, 40.0, 40.0, 39.0, 35.0, 35.0, 35.0, 32.0, 37.0, 34.0, 27.0, 38.0, 20.0, 26.0, 26.0, 22.0, 20.0, 16.0, 11.0, 7.0, 2.0, 12.0, 8.0, 1.0, 3.0, 8.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.875247955322266, -31.789060592651367, -30.70287322998047, -29.61668586730957, -28.530498504638672, -27.444311141967773, -26.358123779296875, -25.271936416625977, -24.185749053955078, -23.09956169128418, -22.01337432861328, -20.927186965942383, -19.840999603271484, -18.754812240600586, -17.668624877929688, -16.58243751525879, -15.49625015258789, -14.410062789916992, -13.323875427246094, -12.237688064575195, -11.151500701904297, -10.065313339233398, -8.9791259765625, -7.892938613891602, -6.806751251220703, -5.720563888549805, -4.634376525878906, -3.548189163208008, -2.4620018005371094, -1.375814437866211, -0.2896270751953125, 0.7965602874755859, 1.8827476501464844, 2.968935012817383, 4.055122375488281, 5.14130973815918, 6.227497100830078, 7.313684463500977, 8.399871826171875, 9.486059188842773, 10.572246551513672, 11.65843391418457, 12.744621276855469, 13.830808639526367, 14.916996002197266, 16.003183364868164, 17.089370727539062, 18.17555809020996, 19.26174545288086, 20.347932815551758, 21.434120178222656, 22.520307540893555, 23.606494903564453, 24.69268226623535, 25.77886962890625, 26.86505699157715, 27.951244354248047, 29.037431716918945, 30.123619079589844, 31.209806442260742, 32.29599380493164, 33.382179260253906, 34.46836853027344, 35.55455780029297, 36.640743255615234]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 7.0, 5.0, 9.0, 8.0, 8.0, 13.0, 17.0, 20.0, 12.0, 19.0, 25.0, 27.0, 29.0, 41.0, 31.0, 43.0, 31.0, 39.0, 39.0, 58.0, 27.0, 33.0, 37.0, 39.0, 38.0, 37.0, 33.0, 36.0, 41.0, 27.0, 33.0, 21.0, 23.0, 17.0, 15.0, 10.0, 12.0, 4.0, 8.0, 8.0, 4.0, 6.0, 5.0, 1.0, 1.0, 1.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-60.84375, -58.99853515625, -57.1533203125, -55.30810546875, -53.462890625, -51.61767578125, -49.7724609375, -47.92724609375, -46.08203125, -44.23681640625, -42.3916015625, -40.54638671875, -38.701171875, -36.85595703125, -35.0107421875, -33.16552734375, -31.3203125, -29.47509765625, -27.6298828125, -25.78466796875, -23.939453125, -22.09423828125, -20.2490234375, -18.40380859375, -16.55859375, -14.71337890625, -12.8681640625, -11.02294921875, -9.177734375, -7.33251953125, -5.4873046875, -3.64208984375, -1.796875, 0.04833984375, 1.8935546875, 3.73876953125, 5.583984375, 7.42919921875, 9.2744140625, 11.11962890625, 12.96484375, 14.81005859375, 16.6552734375, 18.50048828125, 20.345703125, 22.19091796875, 24.0361328125, 25.88134765625, 27.7265625, 29.57177734375, 31.4169921875, 33.26220703125, 35.107421875, 36.95263671875, 38.7978515625, 40.64306640625, 42.48828125, 44.33349609375, 46.1787109375, 48.02392578125, 49.869140625, 51.71435546875, 53.5595703125, 55.40478515625, 57.25]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 3.0, 13.0, 13.0, 21.0, 29.0, 45.0, 63.0, 94.0, 127.0, 187.0, 265.0, 418.0, 517.0, 794.0, 1126.0, 1666.0, 2370.0, 3625.0, 5111.0, 7523.0, 11144.0, 17112.0, 26538.0, 41898.0, 68344.0, 112167.0, 171683.0, 192703.0, 142653.0, 88303.0, 53985.0, 33536.0, 21496.0, 14059.0, 9208.0, 6201.0, 4183.0, 2926.0, 1886.0, 1325.0, 981.0, 650.0, 485.0, 345.0, 236.0, 153.0, 116.0, 92.0, 48.0, 40.0, 22.0, 14.0, 8.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0], "bins": [-4.85546875, -4.70013427734375, -4.5447998046875, -4.38946533203125, -4.234130859375, -4.07879638671875, -3.9234619140625, -3.76812744140625, -3.61279296875, -3.45745849609375, -3.3021240234375, -3.14678955078125, -2.991455078125, -2.83612060546875, -2.6807861328125, -2.52545166015625, -2.3701171875, -2.21478271484375, -2.0594482421875, -1.90411376953125, -1.748779296875, -1.59344482421875, -1.4381103515625, -1.28277587890625, -1.12744140625, -0.97210693359375, -0.8167724609375, -0.66143798828125, -0.506103515625, -0.35076904296875, -0.1954345703125, -0.04010009765625, 0.115234375, 0.27056884765625, 0.4259033203125, 0.58123779296875, 0.736572265625, 0.89190673828125, 1.0472412109375, 1.20257568359375, 1.35791015625, 1.51324462890625, 1.6685791015625, 1.82391357421875, 1.979248046875, 2.13458251953125, 2.2899169921875, 2.44525146484375, 2.6005859375, 2.75592041015625, 2.9112548828125, 3.06658935546875, 3.221923828125, 3.37725830078125, 3.5325927734375, 3.68792724609375, 3.84326171875, 3.99859619140625, 4.1539306640625, 4.30926513671875, 4.464599609375, 4.61993408203125, 4.7752685546875, 4.93060302734375, 5.0859375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 9.0, 6.0, 14.0, 14.0, 9.0, 12.0, 21.0, 19.0, 17.0, 21.0, 26.0, 25.0, 31.0, 18.0, 28.0, 30.0, 31.0, 46.0, 39.0, 41.0, 1064.0, 32.0, 39.0, 39.0, 37.0, 36.0, 27.0, 37.0, 34.0, 38.0, 29.0, 16.0, 17.0, 20.0, 22.0, 16.0, 9.0, 15.0, 9.0, 10.0, 9.0, 5.0, 5.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.375, -32.28125, -31.1875, -30.09375, -29.0, -27.90625, -26.8125, -25.71875, -24.625, -23.53125, -22.4375, -21.34375, -20.25, -19.15625, -18.0625, -16.96875, -15.875, -14.78125, -13.6875, -12.59375, -11.5, -10.40625, -9.3125, -8.21875, -7.125, -6.03125, -4.9375, -3.84375, -2.75, -1.65625, -0.5625, 0.53125, 1.625, 2.71875, 3.8125, 4.90625, 6.0, 7.09375, 8.1875, 9.28125, 10.375, 11.46875, 12.5625, 13.65625, 14.75, 15.84375, 16.9375, 18.03125, 19.125, 20.21875, 21.3125, 22.40625, 23.5, 24.59375, 25.6875, 26.78125, 27.875, 28.96875, 30.0625, 31.15625, 32.25, 33.34375, 34.4375, 35.53125, 36.625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 8.0, 7.0, 7.0, 16.0, 34.0, 49.0, 66.0, 103.0, 148.0, 214.0, 335.0, 550.0, 784.0, 1250.0, 1923.0, 3099.0, 4809.0, 7321.0, 11887.0, 18642.0, 30062.0, 49319.0, 84121.0, 138909.0, 1242185.0, 185387.0, 124993.0, 74025.0, 43844.0, 26912.0, 16870.0, 10609.0, 6706.0, 4293.0, 2712.0, 1718.0, 1153.0, 744.0, 437.0, 289.0, 193.0, 143.0, 86.0, 53.0, 38.0, 31.0, 18.0, 10.0, 7.0, 4.0, 7.0, 0.0, 2.0, 1.0, 3.0, 2.0], "bins": [-5.43359375, -5.26837158203125, -5.1031494140625, -4.93792724609375, -4.772705078125, -4.60748291015625, -4.4422607421875, -4.27703857421875, -4.11181640625, -3.94659423828125, -3.7813720703125, -3.61614990234375, -3.450927734375, -3.28570556640625, -3.1204833984375, -2.95526123046875, -2.7900390625, -2.62481689453125, -2.4595947265625, -2.29437255859375, -2.129150390625, -1.96392822265625, -1.7987060546875, -1.63348388671875, -1.46826171875, -1.30303955078125, -1.1378173828125, -0.97259521484375, -0.807373046875, -0.64215087890625, -0.4769287109375, -0.31170654296875, -0.146484375, 0.01873779296875, 0.1839599609375, 0.34918212890625, 0.514404296875, 0.67962646484375, 0.8448486328125, 1.01007080078125, 1.17529296875, 1.34051513671875, 1.5057373046875, 1.67095947265625, 1.836181640625, 2.00140380859375, 2.1666259765625, 2.33184814453125, 2.4970703125, 2.66229248046875, 2.8275146484375, 2.99273681640625, 3.157958984375, 3.32318115234375, 3.4884033203125, 3.65362548828125, 3.81884765625, 3.98406982421875, 4.1492919921875, 4.31451416015625, 4.479736328125, 4.64495849609375, 4.8101806640625, 4.97540283203125, 5.140625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 7.0, 8.0, 7.0, 7.0, 9.0, 20.0, 16.0, 25.0, 35.0, 38.0, 48.0, 39.0, 61.0, 55.0, 66.0, 53.0, 58.0, 69.0, 56.0, 44.0, 50.0, 44.0, 37.0, 19.0, 25.0, 13.0, 13.0, 12.0, 10.0, 8.0, 5.0, 9.0, 2.0, 3.0, 4.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-0.01947021484375, -0.018851041793823242, -0.018231868743896484, -0.017612695693969727, -0.01699352264404297, -0.01637434959411621, -0.015755176544189453, -0.015136003494262695, -0.014516830444335938, -0.01389765739440918, -0.013278484344482422, -0.012659311294555664, -0.012040138244628906, -0.011420965194702148, -0.01080179214477539, -0.010182619094848633, -0.009563446044921875, -0.008944272994995117, -0.00832509994506836, -0.0077059268951416016, -0.007086753845214844, -0.006467580795288086, -0.005848407745361328, -0.00522923469543457, -0.0046100616455078125, -0.003990888595581055, -0.003371715545654297, -0.002752542495727539, -0.0021333694458007812, -0.0015141963958740234, -0.0008950233459472656, -0.0002758502960205078, 0.00034332275390625, 0.0009624958038330078, 0.0015816688537597656, 0.0022008419036865234, 0.0028200149536132812, 0.003439188003540039, 0.004058361053466797, 0.004677534103393555, 0.0052967071533203125, 0.00591588020324707, 0.006535053253173828, 0.007154226303100586, 0.007773399353027344, 0.008392572402954102, 0.00901174545288086, 0.009630918502807617, 0.010250091552734375, 0.010869264602661133, 0.01148843765258789, 0.012107610702514648, 0.012726783752441406, 0.013345956802368164, 0.013965129852294922, 0.01458430290222168, 0.015203475952148438, 0.015822649002075195, 0.016441822052001953, 0.01706099510192871, 0.01768016815185547, 0.018299341201782227, 0.018918514251708984, 0.019537687301635742, 0.0201568603515625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 5.0, 10.0, 5.0, 5.0, 4.0, 7.0, 9.0, 13.0, 17.0, 28.0, 20.0, 33.0, 39.0, 42.0, 58.0, 65.0, 109.0, 122.0, 163.0, 204.0, 327.0, 484.0, 820.0, 1449.0, 2961.0, 8089.0, 31627.0, 168568.0, 487806.0, 271617.0, 52949.0, 12035.0, 4050.0, 1818.0, 1000.0, 594.0, 393.0, 262.0, 176.0, 126.0, 104.0, 70.0, 72.0, 48.0, 34.0, 20.0, 15.0, 17.0, 19.0, 8.0, 13.0, 12.0, 10.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.119140625, -0.11537742614746094, -0.11161422729492188, -0.10785102844238281, -0.10408782958984375, -0.10032463073730469, -0.09656143188476562, -0.09279823303222656, -0.0890350341796875, -0.08527183532714844, -0.08150863647460938, -0.07774543762207031, -0.07398223876953125, -0.07021903991699219, -0.06645584106445312, -0.06269264221191406, -0.058929443359375, -0.05516624450683594, -0.051403045654296875, -0.04763984680175781, -0.04387664794921875, -0.04011344909667969, -0.036350250244140625, -0.03258705139160156, -0.0288238525390625, -0.025060653686523438, -0.021297454833984375, -0.017534255981445312, -0.01377105712890625, -0.010007858276367188, -0.006244659423828125, -0.0024814605712890625, 0.00128173828125, 0.0050449371337890625, 0.008808135986328125, 0.012571334838867188, 0.01633453369140625, 0.020097732543945312, 0.023860931396484375, 0.027624130249023438, 0.0313873291015625, 0.03515052795410156, 0.038913726806640625, 0.04267692565917969, 0.04644012451171875, 0.05020332336425781, 0.053966522216796875, 0.05772972106933594, 0.061492919921875, 0.06525611877441406, 0.06901931762695312, 0.07278251647949219, 0.07654571533203125, 0.08030891418457031, 0.08407211303710938, 0.08783531188964844, 0.0915985107421875, 0.09536170959472656, 0.09912490844726562, 0.10288810729980469, 0.10665130615234375, 0.11041450500488281, 0.11417770385742188, 0.11794090270996094, 0.1217041015625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 8.0, 13.0, 18.0, 32.0, 59.0, 89.0, 157.0, 162.0, 174.0, 120.0, 89.0, 36.0, 23.0, 10.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029040951281785965, -0.02810007706284523, -0.027159204706549644, -0.02621833048760891, -0.025277458131313324, -0.02433658391237259, -0.023395709693431854, -0.02245483547449112, -0.021513963118195534, -0.0205730888992548, -0.019632216542959213, -0.01869134232401848, -0.017750468105077744, -0.016809595748782158, -0.015868721529841423, -0.014927848242223263, -0.013986974954605103, -0.013046101666986942, -0.012105228379368782, -0.011164354160428047, -0.010223480872809887, -0.009282607585191727, -0.008341733366250992, -0.007400860078632832, -0.006459986791014671, -0.005519113503396511, -0.0045782397501170635, -0.0036373662296682596, -0.0026964927092194557, -0.0017556194216012955, -0.0008147456683218479, 0.00012612808495759964, 0.0010670013725757599, 0.002007874893024564, 0.0029487484134733677, 0.0038896219339221716, 0.0048304954543709755, 0.005771368741989136, 0.006712242495268583, 0.007653116248548031, 0.008593989536166191, 0.009534862823784351, 0.010475736111402512, 0.011416610330343246, 0.012357483617961407, 0.013298356905579567, 0.014239231124520302, 0.015180104412138462, 0.016120977699756622, 0.017061851918697357, 0.018002724274992943, 0.018943598493933678, 0.019884470850229263, 0.020825345069169998, 0.021766219288110733, 0.022707093507051468, 0.023647965863347054, 0.02458884008228779, 0.025529712438583374, 0.02647058665752411, 0.027411460876464844, 0.02835233323276043, 0.029293207451701164, 0.03023407980799675, 0.031174954026937485]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 7.0, 8.0, 8.0, 9.0, 15.0, 13.0, 16.0, 16.0, 19.0, 24.0, 21.0, 30.0, 29.0, 33.0, 33.0, 30.0, 48.0, 42.0, 49.0, 36.0, 35.0, 50.0, 43.0, 39.0, 19.0, 29.0, 26.0, 30.0, 37.0, 24.0, 21.0, 27.0, 22.0, 31.0, 8.0, 13.0, 8.0, 12.0, 8.0, 10.0, 5.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010111868381500244, -0.00979091040790081, -0.009469952434301376, -0.009148994460701942, -0.008828036487102509, -0.008507078513503075, -0.00818612053990364, -0.007865162566304207, -0.007544204592704773, -0.007223246619105339, -0.006902288645505905, -0.006581330671906471, -0.006260372698307037, -0.0059394147247076035, -0.0056184567511081696, -0.005297498777508736, -0.004976540803909302, -0.004655582830309868, -0.004334624856710434, -0.004013666883111, -0.003692708909511566, -0.0033717509359121323, -0.0030507929623126984, -0.0027298349887132645, -0.0024088770151138306, -0.0020879190415143967, -0.0017669610679149628, -0.0014460030943155289, -0.001125045120716095, -0.0008040871471166611, -0.00048312917351722717, -0.00016217119991779327, 0.00015878677368164062, 0.0004797447472810745, 0.0008007027208805084, 0.0011216606944799423, 0.0014426186680793762, 0.0017635766416788101, 0.002084534615278244, 0.002405492588877678, 0.002726450562477112, 0.0030474085360765457, 0.0033683665096759796, 0.0036893244832754135, 0.004010282456874847, 0.004331240430474281, 0.004652198404073715, 0.004973156377673149, 0.005294114351272583, 0.005615072324872017, 0.005936030298471451, 0.006256988272070885, 0.006577946245670319, 0.0068989042192697525, 0.007219862192869186, 0.00754082016646862, 0.007861778140068054, 0.008182736113667488, 0.008503694087266922, 0.008824652060866356, 0.00914561003446579, 0.009466568008065224, 0.009787525981664658, 0.010108483955264091, 0.010429441928863525]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 7.0, 5.0, 9.0, 8.0, 7.0, 14.0, 17.0, 20.0, 12.0, 18.0, 26.0, 27.0, 29.0, 38.0, 34.0, 41.0, 33.0, 39.0, 38.0, 57.0, 29.0, 31.0, 39.0, 38.0, 39.0, 37.0, 31.0, 36.0, 43.0, 27.0, 32.0, 22.0, 22.0, 17.0, 16.0, 10.0, 11.0, 5.0, 8.0, 8.0, 4.0, 6.0, 5.0, 1.0, 1.0, 1.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0], "bins": [-60.875, -59.0302734375, -57.185546875, -55.3408203125, -53.49609375, -51.6513671875, -49.806640625, -47.9619140625, -46.1171875, -44.2724609375, -42.427734375, -40.5830078125, -38.73828125, -36.8935546875, -35.048828125, -33.2041015625, -31.359375, -29.5146484375, -27.669921875, -25.8251953125, -23.98046875, -22.1357421875, -20.291015625, -18.4462890625, -16.6015625, -14.7568359375, -12.912109375, -11.0673828125, -9.22265625, -7.3779296875, -5.533203125, -3.6884765625, -1.84375, 0.0009765625, 1.845703125, 3.6904296875, 5.53515625, 7.3798828125, 9.224609375, 11.0693359375, 12.9140625, 14.7587890625, 16.603515625, 18.4482421875, 20.29296875, 22.1376953125, 23.982421875, 25.8271484375, 27.671875, 29.5166015625, 31.361328125, 33.2060546875, 35.05078125, 36.8955078125, 38.740234375, 40.5849609375, 42.4296875, 44.2744140625, 46.119140625, 47.9638671875, 49.80859375, 51.6533203125, 53.498046875, 55.3427734375, 57.1875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 9.0, 11.0, 10.0, 11.0, 13.0, 21.0, 24.0, 41.0, 73.0, 74.0, 104.0, 185.0, 242.0, 511.0, 828.0, 1521.0, 2982.0, 6660.0, 17994.0, 72826.0, 417862.0, 421263.0, 73687.0, 18189.0, 6745.0, 3049.0, 1479.0, 812.0, 448.0, 288.0, 188.0, 108.0, 82.0, 55.0, 37.0, 26.0, 17.0, 20.0, 11.0, 11.0, 9.0, 7.0, 5.0, 5.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.578125, -16.0758056640625, -15.573486328125, -15.0711669921875, -14.56884765625, -14.0665283203125, -13.564208984375, -13.0618896484375, -12.5595703125, -12.0572509765625, -11.554931640625, -11.0526123046875, -10.55029296875, -10.0479736328125, -9.545654296875, -9.0433349609375, -8.541015625, -8.0386962890625, -7.536376953125, -7.0340576171875, -6.53173828125, -6.0294189453125, -5.527099609375, -5.0247802734375, -4.5224609375, -4.0201416015625, -3.517822265625, -3.0155029296875, -2.51318359375, -2.0108642578125, -1.508544921875, -1.0062255859375, -0.50390625, -0.0015869140625, 0.500732421875, 1.0030517578125, 1.50537109375, 2.0076904296875, 2.510009765625, 3.0123291015625, 3.5146484375, 4.0169677734375, 4.519287109375, 5.0216064453125, 5.52392578125, 6.0262451171875, 6.528564453125, 7.0308837890625, 7.533203125, 8.0355224609375, 8.537841796875, 9.0401611328125, 9.54248046875, 10.0447998046875, 10.547119140625, 11.0494384765625, 11.5517578125, 12.0540771484375, 12.556396484375, 13.0587158203125, 13.56103515625, 14.0633544921875, 14.565673828125, 15.0679931640625, 15.5703125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 20.0, 11.0, 49.0, 70.0, 100.0, 128.0, 2200.0, 150.0, 115.0, 82.0, 58.0, 35.0, 14.0, 11.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-235.875, -227.638671875, -219.40234375, -211.166015625, -202.9296875, -194.693359375, -186.45703125, -178.220703125, -169.984375, -161.748046875, -153.51171875, -145.275390625, -137.0390625, -128.802734375, -120.56640625, -112.330078125, -104.09375, -95.857421875, -87.62109375, -79.384765625, -71.1484375, -62.912109375, -54.67578125, -46.439453125, -38.203125, -29.966796875, -21.73046875, -13.494140625, -5.2578125, 2.978515625, 11.21484375, 19.451171875, 27.6875, 35.923828125, 44.16015625, 52.396484375, 60.6328125, 68.869140625, 77.10546875, 85.341796875, 93.578125, 101.814453125, 110.05078125, 118.287109375, 126.5234375, 134.759765625, 142.99609375, 151.232421875, 159.46875, 167.705078125, 175.94140625, 184.177734375, 192.4140625, 200.650390625, 208.88671875, 217.123046875, 225.359375, 233.595703125, 241.83203125, 250.068359375, 258.3046875, 266.541015625, 274.77734375, 283.013671875, 291.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 12.0, 18.0, 41.0, 48.0, 92.0, 186.0, 408.0, 942.0, 3591.0, 132671.0, 2994649.0, 10391.0, 1526.0, 594.0, 256.0, 113.0, 62.0, 38.0, 24.0, 17.0, 6.0, 4.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.96875, -55.39599609375, -53.8232421875, -52.25048828125, -50.677734375, -49.10498046875, -47.5322265625, -45.95947265625, -44.38671875, -42.81396484375, -41.2412109375, -39.66845703125, -38.095703125, -36.52294921875, -34.9501953125, -33.37744140625, -31.8046875, -30.23193359375, -28.6591796875, -27.08642578125, -25.513671875, -23.94091796875, -22.3681640625, -20.79541015625, -19.22265625, -17.64990234375, -16.0771484375, -14.50439453125, -12.931640625, -11.35888671875, -9.7861328125, -8.21337890625, -6.640625, -5.06787109375, -3.4951171875, -1.92236328125, -0.349609375, 1.22314453125, 2.7958984375, 4.36865234375, 5.94140625, 7.51416015625, 9.0869140625, 10.65966796875, 12.232421875, 13.80517578125, 15.3779296875, 16.95068359375, 18.5234375, 20.09619140625, 21.6689453125, 23.24169921875, 24.814453125, 26.38720703125, 27.9599609375, 29.53271484375, 31.10546875, 32.67822265625, 34.2509765625, 35.82373046875, 37.396484375, 38.96923828125, 40.5419921875, 42.11474609375, 43.6875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 8.0, 9.0, 19.0, 54.0, 177.0, 366.0, 246.0, 73.0, 30.0, 8.0, 8.0, 3.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-554.8307495117188, -543.8906860351562, -532.9505615234375, -522.010498046875, -511.07037353515625, -500.1302795410156, -489.190185546875, -478.2500915527344, -467.30999755859375, -456.3699035644531, -445.4298095703125, -434.4897155761719, -423.54962158203125, -412.6095275878906, -401.66943359375, -390.7293395996094, -379.78924560546875, -368.8491516113281, -357.9090576171875, -346.9689636230469, -336.02886962890625, -325.0887756347656, -314.148681640625, -303.2085876464844, -292.2685241699219, -281.32843017578125, -270.3883361816406, -259.4482421875, -248.50814819335938, -237.56805419921875, -226.62796020507812, -215.6878662109375, -204.7477569580078, -193.8076629638672, -182.86756896972656, -171.92747497558594, -160.9873809814453, -150.0472869873047, -139.10720825195312, -128.1671142578125, -117.22701263427734, -106.28691864013672, -95.3468246459961, -84.40673828125, -73.46664428710938, -62.526546478271484, -51.586456298828125, -40.6463623046875, -29.706268310546875, -18.76617431640625, -7.826082229614258, 3.1140098571777344, 14.05410385131836, 24.994197845458984, 35.934288024902344, 46.87438201904297, 57.814476013183594, 68.75457000732422, 79.69466400146484, 90.63475036621094, 101.57484436035156, 112.51493835449219, 123.45503234863281, 134.39512634277344, 145.33522033691406]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0, 3.0, 4.0, 7.0, 8.0, 7.0, 8.0, 12.0, 17.0, 10.0, 23.0, 25.0, 19.0, 22.0, 17.0, 19.0, 28.0, 39.0, 41.0, 24.0, 35.0, 45.0, 38.0, 30.0, 42.0, 49.0, 35.0, 39.0, 45.0, 36.0, 29.0, 28.0, 38.0, 23.0, 22.0, 18.0, 23.0, 11.0, 13.0, 13.0, 16.0, 15.0, 4.0, 6.0, 7.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 1.0], "bins": [-106.38986206054688, -103.12745666503906, -99.86505889892578, -96.60265350341797, -93.34024810791016, -90.07785034179688, -86.81544494628906, -83.55303955078125, -80.29063415527344, -77.02822875976562, -73.76583099365234, -70.50342559814453, -67.24102020263672, -63.97861862182617, -60.716217041015625, -57.45381164550781, -54.19141387939453, -50.929012298583984, -47.66660690307617, -44.404205322265625, -41.14179992675781, -37.879398345947266, -34.61699676513672, -31.35459327697754, -28.09218978881836, -24.82978630065918, -21.5673828125, -18.304981231689453, -15.042577743530273, -11.780174255371094, -8.517772674560547, -5.255369186401367, -1.9929733276367188, 1.2694296836853027, 4.531832695007324, 7.7942352294921875, 11.056638717651367, 14.319042205810547, 17.581443786621094, 20.843847274780273, 24.106250762939453, 27.368654251098633, 30.631057739257812, 33.89345932006836, 37.155860900878906, 40.41826629638672, 43.680667877197266, 46.94306945800781, 50.205474853515625, 53.46787643432617, 56.730281829833984, 59.99268341064453, 63.255088806152344, 66.51748657226562, 69.77989196777344, 73.04229736328125, 76.30470275878906, 79.56710815429688, 82.82950592041016, 86.09191131591797, 89.35431671142578, 92.61671447753906, 95.87911987304688, 99.14152526855469, 102.40392303466797]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 2.0, 8.0, 8.0, 7.0, 4.0, 9.0, 8.0, 13.0, 20.0, 28.0, 31.0, 31.0, 39.0, 74.0, 84.0, 112.0, 142.0, 182.0, 261.0, 285.0, 347.0, 497.0, 616.0, 819.0, 1039981.0, 1470.0, 787.0, 559.0, 480.0, 355.0, 291.0, 221.0, 195.0, 142.0, 117.0, 82.0, 59.0, 49.0, 37.0, 28.0, 18.0, 17.0, 9.0, 9.0, 11.0, 7.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.206989288330078, -30.12735939025879, -29.047731399536133, -27.968101501464844, -26.888473510742188, -25.8088436126709, -24.72921371459961, -23.649585723876953, -22.569955825805664, -21.490325927734375, -20.41069793701172, -19.33106803894043, -18.25143814086914, -17.171810150146484, -16.092180252075195, -15.012551307678223, -13.93292236328125, -12.853293418884277, -11.773664474487305, -10.694034576416016, -9.614405632019043, -8.53477668762207, -7.4551472663879395, -6.375517845153809, -5.295888900756836, -4.216259956359863, -3.1366305351257324, -2.0570013523101807, -0.9773721694946289, 0.10225677490234375, 1.1818861961364746, 2.2615156173706055, 3.3411483764648438, 4.420777320861816, 5.500406742095947, 6.580036163330078, 7.659665107727051, 8.739294052124023, 9.818923950195312, 10.898552894592285, 11.978181838989258, 13.05781078338623, 14.137439727783203, 15.217069625854492, 16.29669952392578, 17.376327514648438, 18.455957412719727, 19.535587310791016, 20.615215301513672, 21.69484519958496, 22.774473190307617, 23.854103088378906, 24.933731079101562, 26.01336097717285, 27.09299087524414, 28.172618865966797, 29.252248764038086, 30.331878662109375, 31.41150665283203, 32.49113464355469, 33.57076644897461, 34.650394439697266, 35.73002243041992, 36.809654235839844, 37.8892822265625]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 6.0, 2.0, 4.0, 7.0, 8.0, 10.0, 15.0, 11.0, 23.0, 72.0, 419.0, 51462140.0, 244.0, 58.0, 37.0, 17.0, 9.0, 7.0, 8.0, 4.0, 3.0, 1.0, 3.0, 9.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3487.510009765625, -3332.45751953125, -3177.4052734375, -3022.352783203125, -2867.300537109375, -2712.248046875, -2557.19580078125, -2402.143310546875, -2247.0908203125, -2092.038330078125, -1936.986083984375, -1781.93359375, -1626.88134765625, -1471.828857421875, -1316.7764892578125, -1161.72412109375, -1006.671875, -851.6195068359375, -696.567138671875, -541.5147094726562, -386.46234130859375, -231.40997314453125, -76.3575439453125, 78.69482421875, 233.7471923828125, 388.799560546875, 543.8519287109375, 698.9043579101562, 853.9567260742188, 1009.0090942382812, 1164.0615234375, 1319.1138916015625, 1474.16650390625, 1629.2188720703125, 1784.271240234375, 1939.32373046875, 2094.3759765625, 2249.428466796875, 2404.48095703125, 2559.533203125, 2714.58544921875, 2869.637939453125, 3024.690185546875, 3179.74267578125, 3334.794921875, 3489.847412109375, 3644.89990234375, 3799.9521484375, 3955.004638671875, 4110.05712890625, 4265.109375, 4420.16162109375, 4575.21435546875, 4730.2666015625, 4885.31884765625, 5040.37109375, 5195.423828125, 5350.47607421875, 5505.52880859375, 5660.5810546875, 5815.63330078125, 5970.685546875, 6125.73828125, 6280.79052734375, 6435.8427734375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 7.0, 9.0, 16.0, 24.0, 38.0, 44.0, 95.0, 149.0, 216.0, 312.0, 450.0, 689.0, 1061.0, 1505.0, 2383.0, 3710.0, 5822.0, 9180.0, 14993.0, 24707.0, 41673.0, 72005.0, 129084.0, 234578.0, 421350.0, 2462647.0, 1917173.0, 414374.0, 231019.0, 126325.0, 70860.0, 40493.0, 23995.0, 14794.0, 9170.0, 5825.0, 3672.0, 2326.0, 1574.0, 1031.0, 691.0, 487.0, 308.0, 196.0, 133.0, 80.0, 56.0, 37.0, 22.0, 27.0, 13.0, 8.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.34765625, -2.26934814453125, -2.1910400390625, -2.11273193359375, -2.034423828125, -1.95611572265625, -1.8778076171875, -1.79949951171875, -1.72119140625, -1.64288330078125, -1.5645751953125, -1.48626708984375, -1.407958984375, -1.32965087890625, -1.2513427734375, -1.17303466796875, -1.0947265625, -1.01641845703125, -0.9381103515625, -0.85980224609375, -0.781494140625, -0.70318603515625, -0.6248779296875, -0.54656982421875, -0.46826171875, -0.38995361328125, -0.3116455078125, -0.23333740234375, -0.155029296875, -0.07672119140625, 0.0015869140625, 0.07989501953125, 0.158203125, 0.23651123046875, 0.3148193359375, 0.39312744140625, 0.471435546875, 0.54974365234375, 0.6280517578125, 0.70635986328125, 0.78466796875, 0.86297607421875, 0.9412841796875, 1.01959228515625, 1.097900390625, 1.17620849609375, 1.2545166015625, 1.33282470703125, 1.4111328125, 1.48944091796875, 1.5677490234375, 1.64605712890625, 1.724365234375, 1.80267333984375, 1.8809814453125, 1.95928955078125, 2.03759765625, 2.11590576171875, 2.1942138671875, 2.27252197265625, 2.350830078125, 2.42913818359375, 2.5074462890625, 2.58575439453125, 2.6640625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 3.0, 7.0, 5.0, 6.0, 9.0, 5.0, 4.0, 12.0, 15.0, 24.0, 21.0, 20.0, 24.0, 40.0, 39.0, 37.0, 47.0, 50.0, 42.0, 64.0, 366.0, 727.0, 50.0, 45.0, 46.0, 41.0, 35.0, 31.0, 36.0, 29.0, 24.0, 17.0, 26.0, 22.0, 13.0, 13.0, 12.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.765625, -14.3065185546875, -13.847412109375, -13.3883056640625, -12.92919921875, -12.4700927734375, -12.010986328125, -11.5518798828125, -11.0927734375, -10.6336669921875, -10.174560546875, -9.7154541015625, -9.25634765625, -8.7972412109375, -8.338134765625, -7.8790283203125, -7.419921875, -6.9608154296875, -6.501708984375, -6.0426025390625, -5.58349609375, -5.1243896484375, -4.665283203125, -4.2061767578125, -3.7470703125, -3.2879638671875, -2.828857421875, -2.3697509765625, -1.91064453125, -1.4515380859375, -0.992431640625, -0.5333251953125, -0.07421875, 0.3848876953125, 0.843994140625, 1.3031005859375, 1.76220703125, 2.2213134765625, 2.680419921875, 3.1395263671875, 3.5986328125, 4.0577392578125, 4.516845703125, 4.9759521484375, 5.43505859375, 5.8941650390625, 6.353271484375, 6.8123779296875, 7.271484375, 7.7305908203125, 8.189697265625, 8.6488037109375, 9.10791015625, 9.5670166015625, 10.026123046875, 10.4852294921875, 10.9443359375, 11.4034423828125, 11.862548828125, 12.3216552734375, 12.78076171875, 13.2398681640625, 13.698974609375, 14.1580810546875, 14.6171875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 0.0, 7.0, 1.0, 4.0, 12.0, 13.0, 14.0, 32.0, 48.0, 77.0, 101.0, 163.0, 242.0, 416.0, 576.0, 887.0, 1316.0, 2109.0, 3142.0, 4693.0, 7217.0, 10766.0, 17148.0, 26569.0, 41934.0, 67815.0, 111488.0, 186995.0, 306314.0, 506348.0, 3463322.0, 637709.0, 346962.0, 211107.0, 127597.0, 77143.0, 47544.0, 29956.0, 18909.0, 11970.0, 7745.0, 5107.0, 3354.0, 2135.0, 1468.0, 936.0, 661.0, 467.0, 311.0, 210.0, 138.0, 105.0, 59.0, 29.0, 21.0, 11.0, 10.0, 8.0, 4.0, 5.0, 0.0, 1.0, 3.0], "bins": [-2.09375, -2.027557373046875, -1.96136474609375, -1.895172119140625, -1.8289794921875, -1.762786865234375, -1.69659423828125, -1.630401611328125, -1.564208984375, -1.498016357421875, -1.43182373046875, -1.365631103515625, -1.2994384765625, -1.233245849609375, -1.16705322265625, -1.100860595703125, -1.03466796875, -0.968475341796875, -0.90228271484375, -0.836090087890625, -0.7698974609375, -0.703704833984375, -0.63751220703125, -0.571319580078125, -0.505126953125, -0.438934326171875, -0.37274169921875, -0.306549072265625, -0.2403564453125, -0.174163818359375, -0.10797119140625, -0.041778564453125, 0.0244140625, 0.090606689453125, 0.15679931640625, 0.222991943359375, 0.2891845703125, 0.355377197265625, 0.42156982421875, 0.487762451171875, 0.553955078125, 0.620147705078125, 0.68634033203125, 0.752532958984375, 0.8187255859375, 0.884918212890625, 0.95111083984375, 1.017303466796875, 1.08349609375, 1.149688720703125, 1.21588134765625, 1.282073974609375, 1.3482666015625, 1.414459228515625, 1.48065185546875, 1.546844482421875, 1.613037109375, 1.679229736328125, 1.74542236328125, 1.811614990234375, 1.8778076171875, 1.944000244140625, 2.01019287109375, 2.076385498046875, 2.142578125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 5.0, 5.0, 11.0, 14.0, 6.0, 19.0, 13.0, 11.0, 18.0, 17.0, 24.0, 21.0, 25.0, 31.0, 25.0, 32.0, 29.0, 38.0, 36.0, 42.0, 101.0, 518.0, 499.0, 63.0, 36.0, 38.0, 32.0, 26.0, 35.0, 29.0, 27.0, 34.0, 23.0, 21.0, 22.0, 14.0, 14.0, 6.0, 8.0, 4.0, 5.0, 6.0, 9.0, 9.0, 5.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-8.5234375, -8.26544189453125, -8.0074462890625, -7.74945068359375, -7.491455078125, -7.23345947265625, -6.9754638671875, -6.71746826171875, -6.45947265625, -6.20147705078125, -5.9434814453125, -5.68548583984375, -5.427490234375, -5.16949462890625, -4.9114990234375, -4.65350341796875, -4.3955078125, -4.13751220703125, -3.8795166015625, -3.62152099609375, -3.363525390625, -3.10552978515625, -2.8475341796875, -2.58953857421875, -2.33154296875, -2.07354736328125, -1.8155517578125, -1.55755615234375, -1.299560546875, -1.04156494140625, -0.7835693359375, -0.52557373046875, -0.267578125, -0.00958251953125, 0.2484130859375, 0.50640869140625, 0.764404296875, 1.02239990234375, 1.2803955078125, 1.53839111328125, 1.79638671875, 2.05438232421875, 2.3123779296875, 2.57037353515625, 2.828369140625, 3.08636474609375, 3.3443603515625, 3.60235595703125, 3.8603515625, 4.11834716796875, 4.3763427734375, 4.63433837890625, 4.892333984375, 5.15032958984375, 5.4083251953125, 5.66632080078125, 5.92431640625, 6.18231201171875, 6.4403076171875, 6.69830322265625, 6.956298828125, 7.21429443359375, 7.4722900390625, 7.73028564453125, 7.98828125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 5.0, 5.0, 8.0, 8.0, 21.0, 22.0, 23.0, 39.0, 57.0, 51.0, 87.0, 92.0, 127.0, 212.0, 248.0, 309.0, 407.0, 601.0, 856.0, 1257.0, 2034.0, 3319.0, 5634.0, 10925.0, 20985.0, 46182.0, 127071.0, 5750424.0, 200802.0, 60734.0, 26954.0, 13450.0, 7217.0, 3870.0, 2328.0, 1530.0, 986.0, 650.0, 503.0, 329.0, 265.0, 220.0, 159.0, 120.0, 78.0, 63.0, 40.0, 33.0, 25.0, 16.0, 15.0, 16.0, 12.0, 5.0, 6.0, 8.0, 2.0, 3.0, 1.0], "bins": [-6.86328125, -6.65313720703125, -6.4429931640625, -6.23284912109375, -6.022705078125, -5.81256103515625, -5.6024169921875, -5.39227294921875, -5.18212890625, -4.97198486328125, -4.7618408203125, -4.55169677734375, -4.341552734375, -4.13140869140625, -3.9212646484375, -3.71112060546875, -3.5009765625, -3.29083251953125, -3.0806884765625, -2.87054443359375, -2.660400390625, -2.45025634765625, -2.2401123046875, -2.02996826171875, -1.81982421875, -1.60968017578125, -1.3995361328125, -1.18939208984375, -0.979248046875, -0.76910400390625, -0.5589599609375, -0.34881591796875, -0.138671875, 0.07147216796875, 0.2816162109375, 0.49176025390625, 0.701904296875, 0.91204833984375, 1.1221923828125, 1.33233642578125, 1.54248046875, 1.75262451171875, 1.9627685546875, 2.17291259765625, 2.383056640625, 2.59320068359375, 2.8033447265625, 3.01348876953125, 3.2236328125, 3.43377685546875, 3.6439208984375, 3.85406494140625, 4.064208984375, 4.27435302734375, 4.4844970703125, 4.69464111328125, 4.90478515625, 5.11492919921875, 5.3250732421875, 5.53521728515625, 5.745361328125, 5.95550537109375, 6.1656494140625, 6.37579345703125, 6.5859375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 4.0, 7.0, 10.0, 10.0, 13.0, 17.0, 13.0, 18.0, 31.0, 25.0, 18.0, 27.0, 26.0, 38.0, 34.0, 42.0, 43.0, 49.0, 97.0, 352.0, 602.0, 111.0, 45.0, 35.0, 43.0, 44.0, 27.0, 36.0, 29.0, 26.0, 20.0, 21.0, 20.0, 16.0, 13.0, 13.0, 9.0, 10.0, 12.0, 5.0, 7.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.19921875, -5.9947509765625, -5.790283203125, -5.5858154296875, -5.38134765625, -5.1768798828125, -4.972412109375, -4.7679443359375, -4.5634765625, -4.3590087890625, -4.154541015625, -3.9500732421875, -3.74560546875, -3.5411376953125, -3.336669921875, -3.1322021484375, -2.927734375, -2.7232666015625, -2.518798828125, -2.3143310546875, -2.10986328125, -1.9053955078125, -1.700927734375, -1.4964599609375, -1.2919921875, -1.0875244140625, -0.883056640625, -0.6785888671875, -0.47412109375, -0.2696533203125, -0.065185546875, 0.1392822265625, 0.34375, 0.5482177734375, 0.752685546875, 0.9571533203125, 1.16162109375, 1.3660888671875, 1.570556640625, 1.7750244140625, 1.9794921875, 2.1839599609375, 2.388427734375, 2.5928955078125, 2.79736328125, 3.0018310546875, 3.206298828125, 3.4107666015625, 3.615234375, 3.8197021484375, 4.024169921875, 4.2286376953125, 4.43310546875, 4.6375732421875, 4.842041015625, 5.0465087890625, 5.2509765625, 5.4554443359375, 5.659912109375, 5.8643798828125, 6.06884765625, 6.2733154296875, 6.477783203125, 6.6822509765625, 6.88671875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 2.0, 2.0, 3.0, 9.0, 4.0, 12.0, 17.0, 33.0, 42.0, 86.0, 130.0, 173.0, 182.0, 144.0, 77.0, 42.0, 23.0, 12.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-29.267953872680664, -28.696414947509766, -28.124876022338867, -27.55333709716797, -26.981796264648438, -26.41025733947754, -25.83871841430664, -25.267179489135742, -24.695640563964844, -24.124101638793945, -23.552562713623047, -22.98102378845215, -22.40948486328125, -21.83794403076172, -21.26640510559082, -20.694866180419922, -20.123327255249023, -19.551788330078125, -18.980249404907227, -18.408710479736328, -17.837169647216797, -17.2656307220459, -16.694091796875, -16.1225528717041, -15.551013946533203, -14.979475021362305, -14.407936096191406, -13.836396217346191, -13.264857292175293, -12.693318367004395, -12.12177848815918, -11.550239562988281, -10.97869873046875, -10.407159805297852, -9.835620880126953, -9.264081001281738, -8.69254207611084, -8.121003150939941, -7.549463748931885, -6.977924346923828, -6.40638542175293, -5.834846496582031, -5.263307094573975, -4.691767692565918, -4.1202287673950195, -3.548689603805542, -2.9771504402160645, -2.405611038208008, -1.8340721130371094, -1.2625329494476318, -0.6909937858581543, -0.11945462226867676, 0.4520845413208008, 1.0236237049102783, 1.5951628684997559, 2.1667022705078125, 2.738241195678711, 3.3097803592681885, 3.881319522857666, 4.452858924865723, 5.024397850036621, 5.5959367752075195, 6.167476177215576, 6.739015579223633, 7.310554504394531]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 3.0, 0.0, 6.0, 9.0, 3.0, 11.0, 12.0, 14.0, 14.0, 11.0, 18.0, 19.0, 17.0, 14.0, 28.0, 25.0, 29.0, 27.0, 46.0, 33.0, 34.0, 34.0, 38.0, 24.0, 42.0, 27.0, 42.0, 43.0, 32.0, 34.0, 31.0, 35.0, 17.0, 29.0, 21.0, 25.0, 21.0, 21.0, 19.0, 13.0, 14.0, 9.0, 9.0, 11.0, 9.0, 6.0, 8.0, 4.0, 0.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0], "bins": [-8.571405410766602, -8.316587448120117, -8.061769485473633, -7.806950569152832, -7.552132606506348, -7.297314643859863, -7.042496204376221, -6.787677764892578, -6.532859802246094, -6.278041839599609, -6.023223400115967, -5.768404960632324, -5.51358699798584, -5.2587690353393555, -5.003950595855713, -4.74913215637207, -4.494314193725586, -4.239496231079102, -3.984677791595459, -3.7298595905303955, -3.475041389465332, -3.2202231884002686, -2.965404987335205, -2.7105867862701416, -2.455768585205078, -2.2009503841400146, -1.9461321830749512, -1.6913139820098877, -1.4364957809448242, -1.1816775798797607, -0.9268593788146973, -0.6720411777496338, -0.4172229766845703, -0.16240477561950684, 0.09241342544555664, 0.3472316265106201, 0.6020498275756836, 0.8568680286407471, 1.1116862297058105, 1.366504430770874, 1.6213226318359375, 1.876140832901001, 2.1309590339660645, 2.385777235031128, 2.6405954360961914, 2.895413637161255, 3.1502318382263184, 3.405050039291382, 3.6598682403564453, 3.914686441421509, 4.169504642486572, 4.424323081970215, 4.679141044616699, 4.933959007263184, 5.188777446746826, 5.443595886230469, 5.698413848876953, 5.9532318115234375, 6.20805025100708, 6.462868690490723, 6.717686653137207, 6.972504615783691, 7.227323055267334, 7.482141494750977, 7.736959457397461]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 8.0, 9.0, 3.0, 8.0, 10.0, 16.0, 29.0, 31.0, 48.0, 40.0, 70.0, 113.0, 135.0, 164.0, 246.0, 400.0, 555.0, 857.0, 1378.0, 2408.0, 4605.0, 10066.0, 28132.0, 178355.0, 3892740.0, 48356.0, 13146.0, 5436.0, 2637.0, 1483.0, 924.0, 578.0, 386.0, 260.0, 168.0, 118.0, 97.0, 63.0, 58.0, 30.0, 24.0, 26.0, 15.0, 15.0, 7.0, 3.0, 11.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.356201171875, -0.3447990417480469, -0.33339691162109375, -0.3219947814941406, -0.3105926513671875, -0.2991905212402344, -0.28778839111328125, -0.2763862609863281, -0.264984130859375, -0.2535820007324219, -0.24217987060546875, -0.23077774047851562, -0.2193756103515625, -0.20797348022460938, -0.19657135009765625, -0.18516921997070312, -0.17376708984375, -0.16236495971679688, -0.15096282958984375, -0.13956069946289062, -0.1281585693359375, -0.11675643920898438, -0.10535430908203125, -0.09395217895507812, -0.082550048828125, -0.07114791870117188, -0.05974578857421875, -0.048343658447265625, -0.0369415283203125, -0.025539398193359375, -0.01413726806640625, -0.002735137939453125, 0.0086669921875, 0.020069122314453125, 0.03147125244140625, 0.042873382568359375, 0.0542755126953125, 0.06567764282226562, 0.07707977294921875, 0.08848190307617188, 0.099884033203125, 0.11128616333007812, 0.12268829345703125, 0.13409042358398438, 0.1454925537109375, 0.15689468383789062, 0.16829681396484375, 0.17969894409179688, 0.19110107421875, 0.20250320434570312, 0.21390533447265625, 0.22530746459960938, 0.2367095947265625, 0.24811172485351562, 0.25951385498046875, 0.2709159851074219, 0.282318115234375, 0.2937202453613281, 0.30512237548828125, 0.3165245056152344, 0.3279266357421875, 0.3393287658691406, 0.35073089599609375, 0.3621330261230469, 0.37353515625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 4.0, 3.0, 10.0, 9.0, 12.0, 15.0, 11.0, 13.0, 19.0, 42.0, 740.0, 19.0, 16.0, 7.0, 9.0, 8.0, 6.0, 5.0, 4.0, 3.0, 5.0, 3.0, 5.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.066650390625, -0.0646367073059082, -0.0626230239868164, -0.06060934066772461, -0.05859565734863281, -0.056581974029541016, -0.05456829071044922, -0.05255460739135742, -0.050540924072265625, -0.04852724075317383, -0.04651355743408203, -0.044499874114990234, -0.04248619079589844, -0.04047250747680664, -0.038458824157714844, -0.03644514083862305, -0.03443145751953125, -0.03241777420043945, -0.030404090881347656, -0.02839040756225586, -0.026376724243164062, -0.024363040924072266, -0.02234935760498047, -0.020335674285888672, -0.018321990966796875, -0.016308307647705078, -0.014294624328613281, -0.012280941009521484, -0.010267257690429688, -0.00825357437133789, -0.006239891052246094, -0.004226207733154297, -0.0022125244140625, -0.00019884109497070312, 0.0018148422241210938, 0.0038285255432128906, 0.0058422088623046875, 0.007855892181396484, 0.009869575500488281, 0.011883258819580078, 0.013896942138671875, 0.015910625457763672, 0.01792430877685547, 0.019937992095947266, 0.021951675415039062, 0.02396535873413086, 0.025979042053222656, 0.027992725372314453, 0.03000640869140625, 0.03202009201049805, 0.034033775329589844, 0.03604745864868164, 0.03806114196777344, 0.040074825286865234, 0.04208850860595703, 0.04410219192504883, 0.046115875244140625, 0.04812955856323242, 0.05014324188232422, 0.052156925201416016, 0.05417060852050781, 0.05618429183959961, 0.058197975158691406, 0.0602116584777832, 0.062225341796875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 13.0, 8.0, 8.0, 13.0, 23.0, 34.0, 55.0, 72.0, 135.0, 213.0, 427.0, 697.0, 1174.0, 2138.0, 3686.0, 7236.0, 14650.0, 35611.0, 115606.0, 765295.0, 2822666.0, 313240.0, 66723.0, 23496.0, 9953.0, 4900.0, 2651.0, 1418.0, 847.0, 460.0, 290.0, 211.0, 108.0, 62.0, 45.0, 27.0, 24.0, 15.0, 9.0, 9.0, 7.0, 5.0, 7.0, 3.0, 4.0, 4.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2412109375, -0.2335052490234375, -0.225799560546875, -0.2180938720703125, -0.21038818359375, -0.2026824951171875, -0.194976806640625, -0.1872711181640625, -0.1795654296875, -0.1718597412109375, -0.164154052734375, -0.1564483642578125, -0.14874267578125, -0.1410369873046875, -0.133331298828125, -0.1256256103515625, -0.117919921875, -0.1102142333984375, -0.102508544921875, -0.0948028564453125, -0.08709716796875, -0.0793914794921875, -0.071685791015625, -0.0639801025390625, -0.0562744140625, -0.0485687255859375, -0.040863037109375, -0.0331573486328125, -0.02545166015625, -0.0177459716796875, -0.010040283203125, -0.0023345947265625, 0.00537109375, 0.0130767822265625, 0.020782470703125, 0.0284881591796875, 0.03619384765625, 0.0438995361328125, 0.051605224609375, 0.0593109130859375, 0.0670166015625, 0.0747222900390625, 0.082427978515625, 0.0901336669921875, 0.09783935546875, 0.1055450439453125, 0.113250732421875, 0.1209564208984375, 0.128662109375, 0.1363677978515625, 0.144073486328125, 0.1517791748046875, 0.15948486328125, 0.1671905517578125, 0.174896240234375, 0.1826019287109375, 0.1903076171875, 0.1980133056640625, 0.205718994140625, 0.2134246826171875, 0.22113037109375, 0.2288360595703125, 0.236541748046875, 0.2442474365234375, 0.251953125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 5.0, 3.0, 9.0, 2.0, 5.0, 9.0, 2.0, 4.0, 9.0, 18.0, 11.0, 18.0, 17.0, 22.0, 41.0, 36.0, 54.0, 101.0, 140.0, 193.0, 428.0, 806.0, 949.0, 463.0, 247.0, 140.0, 101.0, 54.0, 40.0, 28.0, 33.0, 11.0, 16.0, 9.0, 10.0, 12.0, 6.0, 2.0, 4.0, 3.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.09686279296875, -0.09402656555175781, -0.09119033813476562, -0.08835411071777344, -0.08551788330078125, -0.08268165588378906, -0.07984542846679688, -0.07700920104980469, -0.0741729736328125, -0.07133674621582031, -0.06850051879882812, -0.06566429138183594, -0.06282806396484375, -0.05999183654785156, -0.057155609130859375, -0.05431938171386719, -0.051483154296875, -0.04864692687988281, -0.045810699462890625, -0.04297447204589844, -0.04013824462890625, -0.03730201721191406, -0.034465789794921875, -0.03162956237792969, -0.0287933349609375, -0.025957107543945312, -0.023120880126953125, -0.020284652709960938, -0.01744842529296875, -0.014612197875976562, -0.011775970458984375, -0.008939743041992188, -0.006103515625, -0.0032672882080078125, -0.000431060791015625, 0.0024051666259765625, 0.00524139404296875, 0.008077621459960938, 0.010913848876953125, 0.013750076293945312, 0.0165863037109375, 0.019422531127929688, 0.022258758544921875, 0.025094985961914062, 0.02793121337890625, 0.030767440795898438, 0.033603668212890625, 0.03643989562988281, 0.039276123046875, 0.04211235046386719, 0.044948577880859375, 0.04778480529785156, 0.05062103271484375, 0.05345726013183594, 0.056293487548828125, 0.05912971496582031, 0.0619659423828125, 0.06480216979980469, 0.06763839721679688, 0.07047462463378906, 0.07331085205078125, 0.07614707946777344, 0.07898330688476562, 0.08181953430175781, 0.08465576171875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 9.0, 3.0, 16.0, 11.0, 17.0, 24.0, 43.0, 66.0, 76.0, 101.0, 109.0, 137.0, 100.0, 94.0, 65.0, 38.0, 24.0, 19.0, 15.0, 3.0, 5.0, 6.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5530398488044739, -0.5374927520751953, -0.5219456553459167, -0.5063984990119934, -0.49085140228271484, -0.4753043055534363, -0.4597572088241577, -0.44421011209487915, -0.4286629855632782, -0.41311588883399963, -0.3975687623023987, -0.3820216655731201, -0.36647456884384155, -0.3509274423122406, -0.33538034558296204, -0.3198332190513611, -0.3042861223220825, -0.28873902559280396, -0.273191899061203, -0.25764480233192444, -0.24209769070148468, -0.22655057907104492, -0.21100348234176636, -0.1954563707113266, -0.17990925908088684, -0.16436214745044708, -0.14881503582000732, -0.13326793909072876, -0.117720827460289, -0.10217371582984924, -0.08662661164999008, -0.07107950747013092, -0.05553239583969116, -0.0399852879345417, -0.024438180029392242, -0.008891072124242783, 0.006656035780906677, 0.022203147411346436, 0.0377502515912056, 0.05329735577106476, 0.06884446740150452, 0.08439157903194427, 0.09993868321180344, 0.1154857873916626, 0.13103289902210236, 0.14658001065254211, 0.16212710738182068, 0.17767421901226044, 0.1932213306427002, 0.20876844227313995, 0.2243155539035797, 0.23986265063285828, 0.25540977716445923, 0.2709568738937378, 0.28650397062301636, 0.3020510673522949, 0.3175981938838959, 0.33314529061317444, 0.3486924171447754, 0.36423951387405396, 0.3797866106033325, 0.39533373713493347, 0.41088083386421204, 0.426427960395813, 0.44197505712509155]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 3.0, 5.0, 7.0, 6.0, 12.0, 7.0, 16.0, 12.0, 15.0, 21.0, 31.0, 36.0, 28.0, 32.0, 37.0, 57.0, 46.0, 54.0, 57.0, 65.0, 51.0, 53.0, 45.0, 47.0, 41.0, 35.0, 31.0, 25.0, 23.0, 21.0, 13.0, 22.0, 9.0, 9.0, 1.0, 4.0, 6.0, 7.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3205842971801758, -0.3089044988155365, -0.2972247302532196, -0.2855449318885803, -0.27386513352394104, -0.26218536496162415, -0.25050556659698486, -0.23882578313350677, -0.2271459996700287, -0.2154662162065506, -0.20378641784191132, -0.19210663437843323, -0.18042685091495514, -0.16874706745147705, -0.15706726908683777, -0.14538748562335968, -0.1337076872587204, -0.12202789634466171, -0.11034811288118362, -0.09866832196712494, -0.08698853850364685, -0.07530874758958817, -0.06362895667552948, -0.05194917321205139, -0.040269382297992706, -0.02858959510922432, -0.016909806057810783, -0.005230017006397247, 0.0064497701823711395, 0.018129557371139526, 0.02980934828519821, 0.0414891317486763, 0.053168922662734985, 0.06484871357679367, 0.07652849704027176, 0.08820828795433044, 0.09988807141780853, 0.11156786233186722, 0.1232476532459259, 0.134927436709404, 0.14660722017288208, 0.15828700363636017, 0.16996680200099945, 0.18164658546447754, 0.19332636892795563, 0.20500615239143372, 0.216685950756073, 0.2283657342195511, 0.24004553258419037, 0.25172531604766846, 0.26340511441230774, 0.275084912776947, 0.2867646813392639, 0.2984444797039032, 0.3101242780685425, 0.3218040466308594, 0.33348384499549866, 0.34516364336013794, 0.35684341192245483, 0.3685232102870941, 0.3802030086517334, 0.3918827772140503, 0.4035625755786896, 0.41524237394332886, 0.42692214250564575]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 7.0, 6.0, 10.0, 19.0, 27.0, 22.0, 49.0, 67.0, 94.0, 143.0, 201.0, 257.0, 387.0, 505.0, 741.0, 1071.0, 1622.0, 2273.0, 3362.0, 5233.0, 8076.0, 13333.0, 24328.0, 93799.0, 764632.0, 71416.0, 21842.0, 12489.0, 7522.0, 4752.0, 3105.0, 2176.0, 1511.0, 1032.0, 677.0, 521.0, 375.0, 290.0, 162.0, 120.0, 98.0, 62.0, 44.0, 37.0, 20.0, 11.0, 8.0, 9.0, 7.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.248291015625, -0.24063682556152344, -0.23298263549804688, -0.2253284454345703, -0.21767425537109375, -0.2100200653076172, -0.20236587524414062, -0.19471168518066406, -0.1870574951171875, -0.17940330505371094, -0.17174911499023438, -0.1640949249267578, -0.15644073486328125, -0.1487865447998047, -0.14113235473632812, -0.13347816467285156, -0.125823974609375, -0.11816978454589844, -0.11051559448242188, -0.10286140441894531, -0.09520721435546875, -0.08755302429199219, -0.07989883422851562, -0.07224464416503906, -0.0645904541015625, -0.05693626403808594, -0.049282073974609375, -0.04162788391113281, -0.03397369384765625, -0.026319503784179688, -0.018665313720703125, -0.011011123657226562, -0.00335693359375, 0.0042972564697265625, 0.011951446533203125, 0.019605636596679688, 0.02725982666015625, 0.03491401672363281, 0.042568206787109375, 0.05022239685058594, 0.0578765869140625, 0.06553077697753906, 0.07318496704101562, 0.08083915710449219, 0.08849334716796875, 0.09614753723144531, 0.10380172729492188, 0.11145591735839844, 0.119110107421875, 0.12676429748535156, 0.13441848754882812, 0.1420726776123047, 0.14972686767578125, 0.1573810577392578, 0.16503524780273438, 0.17268943786621094, 0.1803436279296875, 0.18799781799316406, 0.19565200805664062, 0.2033061981201172, 0.21096038818359375, 0.2186145782470703, 0.22626876831054688, 0.23392295837402344, 0.2415771484375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 7.0, 3.0, 7.0, 3.0, 3.0, 8.0, 8.0, 12.0, 8.0, 9.0, 15.0, 24.0, 57.0, 187.0, 327.0, 169.0, 69.0, 12.0, 10.0, 6.0, 10.0, 4.0, 5.0, 4.0, 5.0, 0.0, 4.0, 4.0, 1.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.057952880859375, -0.05620527267456055, -0.054457664489746094, -0.05271005630493164, -0.05096244812011719, -0.049214839935302734, -0.04746723175048828, -0.04571962356567383, -0.043972015380859375, -0.04222440719604492, -0.04047679901123047, -0.038729190826416016, -0.03698158264160156, -0.03523397445678711, -0.033486366271972656, -0.0317387580871582, -0.02999114990234375, -0.028243541717529297, -0.026495933532714844, -0.02474832534790039, -0.023000717163085938, -0.021253108978271484, -0.01950550079345703, -0.017757892608642578, -0.016010284423828125, -0.014262676239013672, -0.012515068054199219, -0.010767459869384766, -0.009019851684570312, -0.007272243499755859, -0.005524635314941406, -0.003777027130126953, -0.0020294189453125, -0.0002818107604980469, 0.0014657974243164062, 0.0032134056091308594, 0.0049610137939453125, 0.006708621978759766, 0.008456230163574219, 0.010203838348388672, 0.011951446533203125, 0.013699054718017578, 0.015446662902832031, 0.017194271087646484, 0.018941879272460938, 0.02068948745727539, 0.022437095642089844, 0.024184703826904297, 0.02593231201171875, 0.027679920196533203, 0.029427528381347656, 0.03117513656616211, 0.03292274475097656, 0.034670352935791016, 0.03641796112060547, 0.03816556930541992, 0.039913177490234375, 0.04166078567504883, 0.04340839385986328, 0.045156002044677734, 0.04690361022949219, 0.04865121841430664, 0.050398826599121094, 0.05214643478393555, 0.05389404296875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 7.0, 7.0, 14.0, 22.0, 51.0, 96.0, 188.0, 469.0, 1321.0, 4146.0, 16563.0, 87519.0, 537478.0, 335134.0, 50577.0, 10440.0, 2899.0, 927.0, 379.0, 162.0, 75.0, 32.0, 24.0, 5.0, 10.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.404296875, -0.38977813720703125, -0.3752593994140625, -0.36074066162109375, -0.346221923828125, -0.33170318603515625, -0.3171844482421875, -0.30266571044921875, -0.28814697265625, -0.27362823486328125, -0.2591094970703125, -0.24459075927734375, -0.230072021484375, -0.21555328369140625, -0.2010345458984375, -0.18651580810546875, -0.1719970703125, -0.15747833251953125, -0.1429595947265625, -0.12844085693359375, -0.113922119140625, -0.09940338134765625, -0.0848846435546875, -0.07036590576171875, -0.05584716796875, -0.04132843017578125, -0.0268096923828125, -0.01229095458984375, 0.002227783203125, 0.01674652099609375, 0.0312652587890625, 0.04578399658203125, 0.060302734375, 0.07482147216796875, 0.0893402099609375, 0.10385894775390625, 0.118377685546875, 0.13289642333984375, 0.1474151611328125, 0.16193389892578125, 0.17645263671875, 0.19097137451171875, 0.2054901123046875, 0.22000885009765625, 0.234527587890625, 0.24904632568359375, 0.2635650634765625, 0.27808380126953125, 0.2926025390625, 0.30712127685546875, 0.3216400146484375, 0.33615875244140625, 0.350677490234375, 0.36519622802734375, 0.3797149658203125, 0.39423370361328125, 0.40875244140625, 0.42327117919921875, 0.4377899169921875, 0.45230865478515625, 0.466827392578125, 0.48134613037109375, 0.4958648681640625, 0.5103836059570312, 0.52490234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 3.0, 11.0, 12.0, 11.0, 6.0, 16.0, 17.0, 25.0, 22.0, 24.0, 29.0, 28.0, 31.0, 33.0, 31.0, 38.0, 41.0, 49.0, 29.0, 35.0, 48.0, 40.0, 44.0, 36.0, 40.0, 46.0, 35.0, 30.0, 39.0, 20.0, 27.0, 21.0, 8.0, 5.0, 16.0, 10.0, 10.0, 7.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2451171875, -0.237274169921875, -0.22943115234375, -0.221588134765625, -0.2137451171875, -0.205902099609375, -0.19805908203125, -0.190216064453125, -0.182373046875, -0.174530029296875, -0.16668701171875, -0.158843994140625, -0.1510009765625, -0.143157958984375, -0.13531494140625, -0.127471923828125, -0.11962890625, -0.111785888671875, -0.10394287109375, -0.096099853515625, -0.0882568359375, -0.080413818359375, -0.07257080078125, -0.064727783203125, -0.056884765625, -0.049041748046875, -0.04119873046875, -0.033355712890625, -0.0255126953125, -0.017669677734375, -0.00982666015625, -0.001983642578125, 0.005859375, 0.013702392578125, 0.02154541015625, 0.029388427734375, 0.0372314453125, 0.045074462890625, 0.05291748046875, 0.060760498046875, 0.068603515625, 0.076446533203125, 0.08428955078125, 0.092132568359375, 0.0999755859375, 0.107818603515625, 0.11566162109375, 0.123504638671875, 0.13134765625, 0.139190673828125, 0.14703369140625, 0.154876708984375, 0.1627197265625, 0.170562744140625, 0.17840576171875, 0.186248779296875, 0.194091796875, 0.201934814453125, 0.20977783203125, 0.217620849609375, 0.2254638671875, 0.233306884765625, 0.24114990234375, 0.248992919921875, 0.2568359375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 7.0, 11.0, 7.0, 16.0, 17.0, 29.0, 35.0, 66.0, 87.0, 146.0, 232.0, 406.0, 672.0, 1312.0, 2999.0, 7695.0, 27928.0, 217499.0, 674021.0, 89063.0, 16245.0, 5256.0, 2190.0, 1099.0, 572.0, 337.0, 193.0, 144.0, 81.0, 51.0, 42.0, 30.0, 16.0, 10.0, 14.0, 10.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.26025390625, -0.2528839111328125, -0.245513916015625, -0.2381439208984375, -0.23077392578125, -0.2234039306640625, -0.216033935546875, -0.2086639404296875, -0.2012939453125, -0.1939239501953125, -0.186553955078125, -0.1791839599609375, -0.17181396484375, -0.1644439697265625, -0.157073974609375, -0.1497039794921875, -0.142333984375, -0.1349639892578125, -0.127593994140625, -0.1202239990234375, -0.11285400390625, -0.1054840087890625, -0.098114013671875, -0.0907440185546875, -0.0833740234375, -0.0760040283203125, -0.068634033203125, -0.0612640380859375, -0.05389404296875, -0.0465240478515625, -0.039154052734375, -0.0317840576171875, -0.0244140625, -0.0170440673828125, -0.009674072265625, -0.0023040771484375, 0.00506591796875, 0.0124359130859375, 0.019805908203125, 0.0271759033203125, 0.0345458984375, 0.0419158935546875, 0.049285888671875, 0.0566558837890625, 0.06402587890625, 0.0713958740234375, 0.078765869140625, 0.0861358642578125, 0.093505859375, 0.1008758544921875, 0.108245849609375, 0.1156158447265625, 0.12298583984375, 0.1303558349609375, 0.137725830078125, 0.1450958251953125, 0.1524658203125, 0.1598358154296875, 0.167205810546875, 0.1745758056640625, 0.18194580078125, 0.1893157958984375, 0.196685791015625, 0.2040557861328125, 0.21142578125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 7.0, 6.0, 13.0, 20.0, 33.0, 28.0, 49.0, 39.0, 39.0, 72.0, 82.0, 97.0, 90.0, 98.0, 78.0, 63.0, 50.0, 30.0, 25.0, 21.0, 15.0, 10.0, 9.0, 7.0, 8.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1457672119140625e-05, -2.069026231765747e-05, -1.9922852516174316e-05, -1.9155442714691162e-05, -1.8388032913208008e-05, -1.7620623111724854e-05, -1.68532133102417e-05, -1.6085803508758545e-05, -1.531839370727539e-05, -1.4550983905792236e-05, -1.3783574104309082e-05, -1.3016164302825928e-05, -1.2248754501342773e-05, -1.1481344699859619e-05, -1.0713934898376465e-05, -9.94652509689331e-06, -9.179115295410156e-06, -8.411705493927002e-06, -7.644295692443848e-06, -6.876885890960693e-06, -6.109476089477539e-06, -5.342066287994385e-06, -4.5746564865112305e-06, -3.807246685028076e-06, -3.039836883544922e-06, -2.2724270820617676e-06, -1.5050172805786133e-06, -7.37607479095459e-07, 2.9802322387695312e-08, 7.972121238708496e-07, 1.564621925354004e-06, 2.332031726837158e-06, 3.0994415283203125e-06, 3.866851329803467e-06, 4.634261131286621e-06, 5.401670932769775e-06, 6.16908073425293e-06, 6.936490535736084e-06, 7.703900337219238e-06, 8.471310138702393e-06, 9.238719940185547e-06, 1.0006129741668701e-05, 1.0773539543151855e-05, 1.154094934463501e-05, 1.2308359146118164e-05, 1.3075768947601318e-05, 1.3843178749084473e-05, 1.4610588550567627e-05, 1.537799835205078e-05, 1.6145408153533936e-05, 1.691281795501709e-05, 1.7680227756500244e-05, 1.84476375579834e-05, 1.9215047359466553e-05, 1.9982457160949707e-05, 2.074986696243286e-05, 2.1517276763916016e-05, 2.228468656539917e-05, 2.3052096366882324e-05, 2.381950616836548e-05, 2.4586915969848633e-05, 2.5354325771331787e-05, 2.612173557281494e-05, 2.6889145374298096e-05, 2.765655517578125e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 6.0, 9.0, 10.0, 9.0, 25.0, 37.0, 54.0, 76.0, 121.0, 196.0, 321.0, 545.0, 935.0, 1841.0, 3936.0, 8939.0, 22521.0, 68378.0, 244392.0, 451402.0, 166176.0, 48092.0, 16927.0, 6850.0, 3176.0, 1430.0, 868.0, 493.0, 280.0, 158.0, 133.0, 64.0, 49.0, 29.0, 25.0, 13.0, 13.0, 4.0, 9.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.129150390625, -0.12475013732910156, -0.12034988403320312, -0.11594963073730469, -0.11154937744140625, -0.10714912414550781, -0.10274887084960938, -0.09834861755371094, -0.0939483642578125, -0.08954811096191406, -0.08514785766601562, -0.08074760437011719, -0.07634735107421875, -0.07194709777832031, -0.06754684448242188, -0.06314659118652344, -0.058746337890625, -0.05434608459472656, -0.049945831298828125, -0.04554557800292969, -0.04114532470703125, -0.03674507141113281, -0.032344818115234375, -0.027944564819335938, -0.0235443115234375, -0.019144058227539062, -0.014743804931640625, -0.010343551635742188, -0.00594329833984375, -0.0015430450439453125, 0.002857208251953125, 0.0072574615478515625, 0.01165771484375, 0.016057968139648438, 0.020458221435546875, 0.024858474731445312, 0.02925872802734375, 0.03365898132324219, 0.038059234619140625, 0.04245948791503906, 0.0468597412109375, 0.05125999450683594, 0.055660247802734375, 0.06006050109863281, 0.06446075439453125, 0.06886100769042969, 0.07326126098632812, 0.07766151428222656, 0.082061767578125, 0.08646202087402344, 0.09086227416992188, 0.09526252746582031, 0.09966278076171875, 0.10406303405761719, 0.10846328735351562, 0.11286354064941406, 0.1172637939453125, 0.12166404724121094, 0.12606430053710938, 0.1304645538330078, 0.13486480712890625, 0.1392650604248047, 0.14366531372070312, 0.14806556701660156, 0.1524658203125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 8.0, 8.0, 12.0, 11.0, 13.0, 20.0, 18.0, 28.0, 39.0, 44.0, 48.0, 55.0, 55.0, 68.0, 60.0, 73.0, 66.0, 44.0, 55.0, 50.0, 42.0, 38.0, 26.0, 22.0, 18.0, 17.0, 12.0, 11.0, 9.0, 9.0, 4.0, 1.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.16845703125, -0.16401958465576172, -0.15958213806152344, -0.15514469146728516, -0.15070724487304688, -0.1462697982788086, -0.1418323516845703, -0.13739490509033203, -0.13295745849609375, -0.12852001190185547, -0.12408256530761719, -0.1196451187133789, -0.11520767211914062, -0.11077022552490234, -0.10633277893066406, -0.10189533233642578, -0.0974578857421875, -0.09302043914794922, -0.08858299255371094, -0.08414554595947266, -0.07970809936523438, -0.0752706527709961, -0.07083320617675781, -0.06639575958251953, -0.06195831298828125, -0.05752086639404297, -0.05308341979980469, -0.048645973205566406, -0.044208526611328125, -0.039771080017089844, -0.03533363342285156, -0.03089618682861328, -0.026458740234375, -0.02202129364013672, -0.017583847045898438, -0.013146400451660156, -0.008708953857421875, -0.004271507263183594, 0.0001659393310546875, 0.004603385925292969, 0.00904083251953125, 0.013478279113769531, 0.017915725708007812, 0.022353172302246094, 0.026790618896484375, 0.031228065490722656, 0.03566551208496094, 0.04010295867919922, 0.0445404052734375, 0.04897785186767578, 0.05341529846191406, 0.057852745056152344, 0.062290191650390625, 0.0667276382446289, 0.07116508483886719, 0.07560253143310547, 0.08003997802734375, 0.08447742462158203, 0.08891487121582031, 0.0933523178100586, 0.09778976440429688, 0.10222721099853516, 0.10666465759277344, 0.11110210418701172, 0.11553955078125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 5.0, 1.0, 4.0, 4.0, 10.0, 14.0, 17.0, 27.0, 34.0, 77.0, 140.0, 197.0, 212.0, 111.0, 62.0, 26.0, 17.0, 11.0, 11.0, 5.0, 9.0, 2.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1132845878601074, -2.012373447418213, -1.911462426185608, -1.8105512857437134, -1.7096402645111084, -1.6087291240692139, -1.5078179836273193, -1.4069069623947144, -1.3059959411621094, -1.2050848007202148, -1.1041737794876099, -1.0032626390457153, -0.9023516178131104, -0.8014404773712158, -0.7005293965339661, -0.5996183156967163, -0.4987071752548218, -0.397796094417572, -0.29688501358032227, -0.19597390294075012, -0.09506282210350037, 0.005848288536071777, 0.10675936937332153, 0.2076704502105713, 0.30858153104782104, 0.4094926118850708, 0.5104036927223206, 0.6113147735595703, 0.7122259140014648, 0.8131369948387146, 0.9140480756759644, 1.0149590969085693, 1.1158702373504639, 1.2167813777923584, 1.3176923990249634, 1.418603539466858, 1.519514560699463, 1.6204257011413574, 1.721336841583252, 1.822247862815857, 1.923158884048462, 2.0240700244903564, 2.124981164932251, 2.2258920669555664, 2.326803207397461, 2.4277143478393555, 2.52862548828125, 2.6295366287231445, 2.730447769165039, 2.8313589096069336, 2.932270050048828, 3.0331809520721436, 3.134092092514038, 3.2350032329559326, 3.335914373397827, 3.4368252754211426, 3.537736415863037, 3.6386475563049316, 3.739558696746826, 3.8404695987701416, 3.941380739212036, 4.042291641235352, 4.143202781677246, 4.244113922119141, 4.345025062561035]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 2.0, 4.0, 3.0, 7.0, 4.0, 4.0, 6.0, 5.0, 12.0, 15.0, 20.0, 34.0, 64.0, 88.0, 129.0, 120.0, 110.0, 106.0, 63.0, 60.0, 39.0, 19.0, 11.0, 7.0, 8.0, 9.0, 4.0, 4.0, 9.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-4.586560249328613, -4.450875759124756, -4.315191268920898, -4.179506778717041, -4.043822288513184, -3.9081380367279053, -3.772453546524048, -3.6367690563201904, -3.501084804534912, -3.3654003143310547, -3.2297158241271973, -3.09403133392334, -2.9583470821380615, -2.822662591934204, -2.6869781017303467, -2.5512936115264893, -2.415609121322632, -2.2799246311187744, -2.144240140914917, -2.0085558891296387, -1.8728713989257812, -1.7371869087219238, -1.6015024185180664, -1.465817928314209, -1.3301335573196411, -1.1944490671157837, -1.0587646961212158, -0.9230802059173584, -0.7873957753181458, -0.6517113447189331, -0.5160268545150757, -0.38034242391586304, -0.2446579933166504, -0.10897354781627655, 0.02671089768409729, 0.16239535808563232, 0.29807978868484497, 0.4337642192840576, 0.569448709487915, 0.7051331400871277, 0.8408175706863403, 0.976502001285553, 1.1121864318847656, 1.247870922088623, 1.3835554122924805, 1.5192397832870483, 1.6549242734909058, 1.7906086444854736, 1.926293134689331, 2.0619776248931885, 2.197662115097046, 2.333346366882324, 2.4690308570861816, 2.604715347290039, 2.7403998374938965, 2.876084327697754, 3.0117688179016113, 3.1474533081054688, 3.283137798309326, 3.4188222885131836, 3.554506540298462, 3.6901910305023193, 3.8258755207061768, 3.961560010910034, 4.0972442626953125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 6.0, 5.0, 8.0, 4.0, 12.0, 12.0, 28.0, 49.0, 89.0, 132.0, 225.0, 516.0, 1070.0, 2585.0, 7887.0, 45067.0, 4039970.0, 84838.0, 7910.0, 2279.0, 838.0, 367.0, 164.0, 107.0, 40.0, 28.0, 17.0, 11.0, 10.0, 3.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6484375, -1.605743408203125, -1.56304931640625, -1.520355224609375, -1.4776611328125, -1.434967041015625, -1.39227294921875, -1.349578857421875, -1.306884765625, -1.264190673828125, -1.22149658203125, -1.178802490234375, -1.1361083984375, -1.093414306640625, -1.05072021484375, -1.008026123046875, -0.96533203125, -0.922637939453125, -0.87994384765625, -0.837249755859375, -0.7945556640625, -0.751861572265625, -0.70916748046875, -0.666473388671875, -0.623779296875, -0.581085205078125, -0.53839111328125, -0.495697021484375, -0.4530029296875, -0.410308837890625, -0.36761474609375, -0.324920654296875, -0.2822265625, -0.239532470703125, -0.19683837890625, -0.154144287109375, -0.1114501953125, -0.068756103515625, -0.02606201171875, 0.016632080078125, 0.059326171875, 0.102020263671875, 0.14471435546875, 0.187408447265625, 0.2301025390625, 0.272796630859375, 0.31549072265625, 0.358184814453125, 0.40087890625, 0.443572998046875, 0.48626708984375, 0.528961181640625, 0.5716552734375, 0.614349365234375, 0.65704345703125, 0.699737548828125, 0.742431640625, 0.785125732421875, 0.82781982421875, 0.870513916015625, 0.9132080078125, 0.955902099609375, 0.99859619140625, 1.041290283203125, 1.083984375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 5.0, 7.0, 10.0, 7.0, 11.0, 11.0, 14.0, 15.0, 26.0, 77.0, 148.0, 211.0, 175.0, 121.0, 56.0, 22.0, 23.0, 12.0, 4.0, 6.0, 5.0, 3.0, 3.0, 1.0, 1.0, 4.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0762939453125, -0.0743107795715332, -0.0723276138305664, -0.07034444808959961, -0.06836128234863281, -0.06637811660766602, -0.06439495086669922, -0.06241178512573242, -0.060428619384765625, -0.05844545364379883, -0.05646228790283203, -0.054479122161865234, -0.05249595642089844, -0.05051279067993164, -0.048529624938964844, -0.04654645919799805, -0.04456329345703125, -0.04258012771606445, -0.040596961975097656, -0.03861379623413086, -0.03663063049316406, -0.034647464752197266, -0.03266429901123047, -0.030681133270263672, -0.028697967529296875, -0.026714801788330078, -0.02473163604736328, -0.022748470306396484, -0.020765304565429688, -0.01878213882446289, -0.016798973083496094, -0.014815807342529297, -0.0128326416015625, -0.010849475860595703, -0.008866310119628906, -0.006883144378662109, -0.0048999786376953125, -0.0029168128967285156, -0.0009336471557617188, 0.0010495185852050781, 0.003032684326171875, 0.005015850067138672, 0.006999015808105469, 0.008982181549072266, 0.010965347290039062, 0.01294851303100586, 0.014931678771972656, 0.016914844512939453, 0.01889801025390625, 0.020881175994873047, 0.022864341735839844, 0.02484750747680664, 0.026830673217773438, 0.028813838958740234, 0.03079700469970703, 0.03278017044067383, 0.034763336181640625, 0.03674650192260742, 0.03872966766357422, 0.040712833404541016, 0.04269599914550781, 0.04467916488647461, 0.046662330627441406, 0.0486454963684082, 0.050628662109375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 8.0, 18.0, 21.0, 36.0, 60.0, 72.0, 128.0, 212.0, 309.0, 561.0, 920.0, 1715.0, 3214.0, 6040.0, 13258.0, 34737.0, 141432.0, 3066853.0, 802629.0, 78034.0, 23611.0, 9807.0, 4640.0, 2492.0, 1451.0, 785.0, 473.0, 288.0, 177.0, 114.0, 61.0, 41.0, 27.0, 13.0, 15.0, 19.0, 8.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3984375, -0.38238525390625, -0.3663330078125, -0.35028076171875, -0.334228515625, -0.31817626953125, -0.3021240234375, -0.28607177734375, -0.27001953125, -0.25396728515625, -0.2379150390625, -0.22186279296875, -0.205810546875, -0.18975830078125, -0.1737060546875, -0.15765380859375, -0.1416015625, -0.12554931640625, -0.1094970703125, -0.09344482421875, -0.077392578125, -0.06134033203125, -0.0452880859375, -0.02923583984375, -0.01318359375, 0.00286865234375, 0.0189208984375, 0.03497314453125, 0.051025390625, 0.06707763671875, 0.0831298828125, 0.09918212890625, 0.115234375, 0.13128662109375, 0.1473388671875, 0.16339111328125, 0.179443359375, 0.19549560546875, 0.2115478515625, 0.22760009765625, 0.24365234375, 0.25970458984375, 0.2757568359375, 0.29180908203125, 0.307861328125, 0.32391357421875, 0.3399658203125, 0.35601806640625, 0.3720703125, 0.38812255859375, 0.4041748046875, 0.42022705078125, 0.436279296875, 0.45233154296875, 0.4683837890625, 0.48443603515625, 0.50048828125, 0.51654052734375, 0.5325927734375, 0.54864501953125, 0.564697265625, 0.58074951171875, 0.5968017578125, 0.61285400390625, 0.62890625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 4.0, 2.0, 5.0, 9.0, 12.0, 11.0, 16.0, 21.0, 22.0, 37.0, 58.0, 110.0, 193.0, 512.0, 1763.0, 729.0, 246.0, 105.0, 63.0, 35.0, 29.0, 19.0, 9.0, 11.0, 3.0, 10.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0938720703125, -0.09090232849121094, -0.08793258666992188, -0.08496284484863281, -0.08199310302734375, -0.07902336120605469, -0.07605361938476562, -0.07308387756347656, -0.0701141357421875, -0.06714439392089844, -0.06417465209960938, -0.06120491027832031, -0.05823516845703125, -0.05526542663574219, -0.052295684814453125, -0.04932594299316406, -0.046356201171875, -0.04338645935058594, -0.040416717529296875, -0.03744697570800781, -0.03447723388671875, -0.03150749206542969, -0.028537750244140625, -0.025568008422851562, -0.0225982666015625, -0.019628524780273438, -0.016658782958984375, -0.013689041137695312, -0.01071929931640625, -0.0077495574951171875, -0.004779815673828125, -0.0018100738525390625, 0.00115966796875, 0.0041294097900390625, 0.007099151611328125, 0.010068893432617188, 0.01303863525390625, 0.016008377075195312, 0.018978118896484375, 0.021947860717773438, 0.0249176025390625, 0.027887344360351562, 0.030857086181640625, 0.03382682800292969, 0.03679656982421875, 0.03976631164550781, 0.042736053466796875, 0.04570579528808594, 0.048675537109375, 0.05164527893066406, 0.054615020751953125, 0.05758476257324219, 0.06055450439453125, 0.06352424621582031, 0.06649398803710938, 0.06946372985839844, 0.0724334716796875, 0.07540321350097656, 0.07837295532226562, 0.08134269714355469, 0.08431243896484375, 0.08728218078613281, 0.09025192260742188, 0.09322166442871094, 0.09619140625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 16.0, 62.0, 265.0, 438.0, 157.0, 38.0, 14.0, 11.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4757307767868042, -0.4336422383785248, -0.39155369997024536, -0.34946519136428833, -0.3073766529560089, -0.2652881145477295, -0.22319960594177246, -0.18111106753349304, -0.13902252912521362, -0.0969339981675148, -0.05484546720981598, -0.012756943702697754, 0.029331594705581665, 0.07142013311386108, 0.11350864171981812, 0.15559718012809753, 0.19768571853637695, 0.23977425694465637, 0.2818627953529358, 0.3239513039588928, 0.36603984236717224, 0.40812838077545166, 0.4502168893814087, 0.4923054277896881, 0.5343939661979675, 0.5764824748039246, 0.6185710430145264, 0.6606595516204834, 0.7027480602264404, 0.7448366284370422, 0.7869251370429993, 0.8290137052536011, 0.8711020946502686, 0.9131906032562256, 0.9552791714668274, 0.9973676800727844, 1.0394562482833862, 1.0815447568893433, 1.1236332654953003, 1.1657217741012573, 1.207810401916504, 1.249898910522461, 1.291987419128418, 1.334075927734375, 1.3761645555496216, 1.4182530641555786, 1.4603415727615356, 1.5024300813674927, 1.5445185899734497, 1.5866070985794067, 1.6286956071853638, 1.6707842350006104, 1.7128727436065674, 1.7549612522125244, 1.7970497608184814, 1.8391382694244385, 1.8812267780303955, 1.9233152866363525, 1.9654037952423096, 2.0074923038482666, 2.0495808124542236, 2.0916695594787598, 2.133758068084717, 2.175846576690674, 2.217935085296631]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 8.0, 1.0, 6.0, 0.0, 4.0, 8.0, 14.0, 19.0, 25.0, 31.0, 55.0, 78.0, 111.0, 125.0, 98.0, 109.0, 83.0, 73.0, 33.0, 34.0, 23.0, 11.0, 6.0, 9.0, 10.0, 4.0, 6.0, 4.0, 5.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.41335439682006836, -0.39719825983047485, -0.38104209303855896, -0.36488595604896545, -0.34872978925704956, -0.33257365226745605, -0.31641751527786255, -0.30026134848594666, -0.28410518169403076, -0.26794904470443726, -0.25179287791252136, -0.23563674092292786, -0.21948057413101196, -0.20332443714141846, -0.18716828525066376, -0.17101213335990906, -0.15485599637031555, -0.13869984447956085, -0.12254369258880615, -0.10638754814863205, -0.09023139625787735, -0.07407524436712265, -0.05791909992694855, -0.04176294803619385, -0.025606796145439148, -0.009450646117329597, 0.006705503910779953, 0.022861652076244354, 0.039017803966999054, 0.055173955857753754, 0.07133010029792786, 0.08748625218868256, 0.10364240407943726, 0.11979855597019196, 0.13595470786094666, 0.15211084485054016, 0.16826701164245605, 0.18442314863204956, 0.20057930052280426, 0.21673545241355896, 0.23289160430431366, 0.24904775619506836, 0.26520389318466187, 0.28136005997657776, 0.29751619696617126, 0.31367236375808716, 0.32982850074768066, 0.34598463773727417, 0.36214080452919006, 0.37829694151878357, 0.39445310831069946, 0.41060924530029297, 0.42676541209220886, 0.44292154908180237, 0.45907771587371826, 0.47523385286331177, 0.4913899898529053, 0.5075461268424988, 0.5237022638320923, 0.5398584604263306, 0.5560145974159241, 0.5721707344055176, 0.5883268713951111, 0.6044830083847046, 0.6206392049789429]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 8.0, 11.0, 16.0, 23.0, 43.0, 67.0, 108.0, 177.0, 280.0, 469.0, 805.0, 1353.0, 2417.0, 4216.0, 8024.0, 17184.0, 50952.0, 281007.0, 537747.0, 94174.0, 25810.0, 10808.0, 5471.0, 3102.0, 1711.0, 1063.0, 594.0, 376.0, 187.0, 118.0, 78.0, 53.0, 31.0, 23.0, 10.0, 9.0, 6.0, 3.0, 3.0, 2.0, 1.0, 4.0, 3.0, 3.0, 0.0, 5.0], "bins": [-0.323974609375, -0.31502723693847656, -0.3060798645019531, -0.2971324920654297, -0.28818511962890625, -0.2792377471923828, -0.2702903747558594, -0.26134300231933594, -0.2523956298828125, -0.24344825744628906, -0.23450088500976562, -0.2255535125732422, -0.21660614013671875, -0.2076587677001953, -0.19871139526367188, -0.18976402282714844, -0.180816650390625, -0.17186927795410156, -0.16292190551757812, -0.1539745330810547, -0.14502716064453125, -0.1360797882080078, -0.12713241577148438, -0.11818504333496094, -0.1092376708984375, -0.10029029846191406, -0.09134292602539062, -0.08239555358886719, -0.07344818115234375, -0.06450080871582031, -0.055553436279296875, -0.04660606384277344, -0.03765869140625, -0.028711318969726562, -0.019763946533203125, -0.010816574096679688, -0.00186920166015625, 0.0070781707763671875, 0.016025543212890625, 0.024972915649414062, 0.0339202880859375, 0.04286766052246094, 0.051815032958984375, 0.06076240539550781, 0.06970977783203125, 0.07865715026855469, 0.08760452270507812, 0.09655189514160156, 0.105499267578125, 0.11444664001464844, 0.12339401245117188, 0.1323413848876953, 0.14128875732421875, 0.1502361297607422, 0.15918350219726562, 0.16813087463378906, 0.1770782470703125, 0.18602561950683594, 0.19497299194335938, 0.2039203643798828, 0.21286773681640625, 0.2218151092529297, 0.23076248168945312, 0.23970985412597656, 0.2486572265625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 6.0, 0.0, 5.0, 5.0, 7.0, 5.0, 4.0, 5.0, 6.0, 3.0, 13.0, 17.0, 24.0, 23.0, 47.0, 57.0, 92.0, 106.0, 150.0, 119.0, 97.0, 75.0, 44.0, 18.0, 26.0, 7.0, 3.0, 3.0, 7.0, 7.0, 3.0, 3.0, 2.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0386962890625, -0.03749704360961914, -0.03629779815673828, -0.03509855270385742, -0.03389930725097656, -0.0327000617980957, -0.031500816345214844, -0.030301570892333984, -0.029102325439453125, -0.027903079986572266, -0.026703834533691406, -0.025504589080810547, -0.024305343627929688, -0.023106098175048828, -0.02190685272216797, -0.02070760726928711, -0.01950836181640625, -0.01830911636352539, -0.01710987091064453, -0.015910625457763672, -0.014711380004882812, -0.013512134552001953, -0.012312889099121094, -0.011113643646240234, -0.009914398193359375, -0.008715152740478516, -0.007515907287597656, -0.006316661834716797, -0.0051174163818359375, -0.003918170928955078, -0.0027189254760742188, -0.0015196800231933594, -0.0003204345703125, 0.0008788108825683594, 0.0020780563354492188, 0.003277301788330078, 0.0044765472412109375, 0.005675792694091797, 0.006875038146972656, 0.008074283599853516, 0.009273529052734375, 0.010472774505615234, 0.011672019958496094, 0.012871265411376953, 0.014070510864257812, 0.015269756317138672, 0.01646900177001953, 0.01766824722290039, 0.01886749267578125, 0.02006673812866211, 0.02126598358154297, 0.022465229034423828, 0.023664474487304688, 0.024863719940185547, 0.026062965393066406, 0.027262210845947266, 0.028461456298828125, 0.029660701751708984, 0.030859947204589844, 0.0320591926574707, 0.03325843811035156, 0.03445768356323242, 0.03565692901611328, 0.03685617446899414, 0.038055419921875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 4.0, 7.0, 8.0, 12.0, 33.0, 196.0, 2703.0, 77494.0, 882484.0, 82279.0, 2994.0, 253.0, 40.0, 14.0, 6.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.85205078125, -0.825836181640625, -0.79962158203125, -0.773406982421875, -0.7471923828125, -0.720977783203125, -0.69476318359375, -0.668548583984375, -0.642333984375, -0.616119384765625, -0.58990478515625, -0.563690185546875, -0.5374755859375, -0.511260986328125, -0.48504638671875, -0.458831787109375, -0.4326171875, -0.406402587890625, -0.38018798828125, -0.353973388671875, -0.3277587890625, -0.301544189453125, -0.27532958984375, -0.249114990234375, -0.222900390625, -0.196685791015625, -0.17047119140625, -0.144256591796875, -0.1180419921875, -0.091827392578125, -0.06561279296875, -0.039398193359375, -0.01318359375, 0.013031005859375, 0.03924560546875, 0.065460205078125, 0.0916748046875, 0.117889404296875, 0.14410400390625, 0.170318603515625, 0.196533203125, 0.222747802734375, 0.24896240234375, 0.275177001953125, 0.3013916015625, 0.327606201171875, 0.35382080078125, 0.380035400390625, 0.40625, 0.432464599609375, 0.45867919921875, 0.484893798828125, 0.5111083984375, 0.537322998046875, 0.56353759765625, 0.589752197265625, 0.615966796875, 0.642181396484375, 0.66839599609375, 0.694610595703125, 0.7208251953125, 0.747039794921875, 0.77325439453125, 0.799468994140625, 0.82568359375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 8.0, 4.0, 5.0, 8.0, 7.0, 10.0, 15.0, 12.0, 9.0, 18.0, 24.0, 22.0, 24.0, 30.0, 26.0, 29.0, 39.0, 42.0, 42.0, 33.0, 42.0, 47.0, 40.0, 51.0, 39.0, 33.0, 35.0, 27.0, 37.0, 24.0, 34.0, 26.0, 30.0, 22.0, 16.0, 23.0, 13.0, 8.0, 13.0, 3.0, 5.0, 9.0, 6.0, 8.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12359619140625, -0.11932659149169922, -0.11505699157714844, -0.11078739166259766, -0.10651779174804688, -0.1022481918334961, -0.09797859191894531, -0.09370899200439453, -0.08943939208984375, -0.08516979217529297, -0.08090019226074219, -0.0766305923461914, -0.07236099243164062, -0.06809139251708984, -0.06382179260253906, -0.05955219268798828, -0.0552825927734375, -0.05101299285888672, -0.04674339294433594, -0.042473793029785156, -0.038204193115234375, -0.033934593200683594, -0.029664993286132812, -0.02539539337158203, -0.02112579345703125, -0.01685619354248047, -0.012586593627929688, -0.008316993713378906, -0.004047393798828125, 0.00022220611572265625, 0.0044918060302734375, 0.008761405944824219, 0.013031005859375, 0.01730060577392578, 0.021570205688476562, 0.025839805603027344, 0.030109405517578125, 0.034379005432128906, 0.03864860534667969, 0.04291820526123047, 0.04718780517578125, 0.05145740509033203, 0.05572700500488281, 0.059996604919433594, 0.06426620483398438, 0.06853580474853516, 0.07280540466308594, 0.07707500457763672, 0.0813446044921875, 0.08561420440673828, 0.08988380432128906, 0.09415340423583984, 0.09842300415039062, 0.1026926040649414, 0.10696220397949219, 0.11123180389404297, 0.11550140380859375, 0.11977100372314453, 0.12404060363769531, 0.1283102035522461, 0.13257980346679688, 0.13684940338134766, 0.14111900329589844, 0.14538860321044922, 0.149658203125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 8.0, 11.0, 28.0, 48.0, 365.0, 621121.0, 426487.0, 377.0, 62.0, 20.0, 3.0, 5.0, 7.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.30859375, -3.21124267578125, -3.1138916015625, -3.01654052734375, -2.919189453125, -2.82183837890625, -2.7244873046875, -2.62713623046875, -2.52978515625, -2.43243408203125, -2.3350830078125, -2.23773193359375, -2.140380859375, -2.04302978515625, -1.9456787109375, -1.84832763671875, -1.7509765625, -1.65362548828125, -1.5562744140625, -1.45892333984375, -1.361572265625, -1.26422119140625, -1.1668701171875, -1.06951904296875, -0.97216796875, -0.87481689453125, -0.7774658203125, -0.68011474609375, -0.582763671875, -0.48541259765625, -0.3880615234375, -0.29071044921875, -0.193359375, -0.09600830078125, 0.0013427734375, 0.09869384765625, 0.196044921875, 0.29339599609375, 0.3907470703125, 0.48809814453125, 0.58544921875, 0.68280029296875, 0.7801513671875, 0.87750244140625, 0.974853515625, 1.07220458984375, 1.1695556640625, 1.26690673828125, 1.3642578125, 1.46160888671875, 1.5589599609375, 1.65631103515625, 1.753662109375, 1.85101318359375, 1.9483642578125, 2.04571533203125, 2.14306640625, 2.24041748046875, 2.3377685546875, 2.43511962890625, 2.532470703125, 2.62982177734375, 2.7271728515625, 2.82452392578125, 2.921875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 5.0, 9.0, 5.0, 5.0, 4.0, 9.0, 9.0, 14.0, 16.0, 22.0, 34.0, 69.0, 96.0, 174.0, 172.0, 134.0, 64.0, 48.0, 23.0, 25.0, 11.0, 12.0, 7.0, 3.0, 3.0, 7.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.00010007619857788086, -9.714718908071518e-05, -9.42181795835495e-05, -9.128917008638382e-05, -8.836016058921814e-05, -8.543115109205246e-05, -8.250214159488678e-05, -7.95731320977211e-05, -7.664412260055542e-05, -7.371511310338974e-05, -7.078610360622406e-05, -6.785709410905838e-05, -6.49280846118927e-05, -6.199907511472702e-05, -5.907006561756134e-05, -5.614105612039566e-05, -5.321204662322998e-05, -5.02830371260643e-05, -4.735402762889862e-05, -4.442501813173294e-05, -4.149600863456726e-05, -3.856699913740158e-05, -3.56379896402359e-05, -3.270898014307022e-05, -2.977997064590454e-05, -2.685096114873886e-05, -2.392195165157318e-05, -2.09929421544075e-05, -1.806393265724182e-05, -1.5134923160076141e-05, -1.2205913662910461e-05, -9.276904165744781e-06, -6.3478946685791016e-06, -3.4188851714134216e-06, -4.898756742477417e-07, 2.4391338229179382e-06, 5.368143320083618e-06, 8.297152817249298e-06, 1.1226162314414978e-05, 1.4155171811580658e-05, 1.7084181308746338e-05, 2.0013190805912018e-05, 2.2942200303077698e-05, 2.5871209800243378e-05, 2.8800219297409058e-05, 3.172922879457474e-05, 3.465823829174042e-05, 3.75872477889061e-05, 4.051625728607178e-05, 4.344526678323746e-05, 4.637427628040314e-05, 4.930328577756882e-05, 5.22322952747345e-05, 5.516130477190018e-05, 5.809031426906586e-05, 6.101932376623154e-05, 6.394833326339722e-05, 6.68773427605629e-05, 6.980635225772858e-05, 7.273536175489426e-05, 7.566437125205994e-05, 7.859338074922562e-05, 8.15223902463913e-05, 8.445139974355698e-05, 8.738040924072266e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 2.0, 3.0, 12.0, 7.0, 15.0, 26.0, 27.0, 48.0, 71.0, 100.0, 207.0, 387.0, 714.0, 1734.0, 5468.0, 22569.0, 136632.0, 587262.0, 243520.0, 37224.0, 8208.0, 2465.0, 929.0, 415.0, 196.0, 115.0, 51.0, 41.0, 35.0, 20.0, 13.0, 9.0, 11.0, 5.0, 5.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.397216796875, -0.3863792419433594, -0.37554168701171875, -0.3647041320800781, -0.3538665771484375, -0.3430290222167969, -0.33219146728515625, -0.3213539123535156, -0.310516357421875, -0.2996788024902344, -0.28884124755859375, -0.2780036926269531, -0.2671661376953125, -0.2563285827636719, -0.24549102783203125, -0.23465347290039062, -0.22381591796875, -0.21297836303710938, -0.20214080810546875, -0.19130325317382812, -0.1804656982421875, -0.16962814331054688, -0.15879058837890625, -0.14795303344726562, -0.137115478515625, -0.12627792358398438, -0.11544036865234375, -0.10460281372070312, -0.0937652587890625, -0.08292770385742188, -0.07209014892578125, -0.061252593994140625, -0.0504150390625, -0.039577484130859375, -0.02873992919921875, -0.017902374267578125, -0.0070648193359375, 0.003772735595703125, 0.01461029052734375, 0.025447845458984375, 0.036285400390625, 0.047122955322265625, 0.05796051025390625, 0.06879806518554688, 0.0796356201171875, 0.09047317504882812, 0.10131072998046875, 0.11214828491210938, 0.12298583984375, 0.13382339477539062, 0.14466094970703125, 0.15549850463867188, 0.1663360595703125, 0.17717361450195312, 0.18801116943359375, 0.19884872436523438, 0.209686279296875, 0.22052383422851562, 0.23136138916015625, 0.24219894409179688, 0.2530364990234375, 0.2638740539550781, 0.27471160888671875, 0.2855491638183594, 0.29638671875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 4.0, 7.0, 11.0, 9.0, 16.0, 25.0, 29.0, 42.0, 48.0, 73.0, 87.0, 90.0, 105.0, 95.0, 64.0, 84.0, 54.0, 53.0, 26.0, 30.0, 19.0, 7.0, 15.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.27734375, -0.2707023620605469, -0.26406097412109375, -0.2574195861816406, -0.2507781982421875, -0.24413681030273438, -0.23749542236328125, -0.23085403442382812, -0.224212646484375, -0.21757125854492188, -0.21092987060546875, -0.20428848266601562, -0.1976470947265625, -0.19100570678710938, -0.18436431884765625, -0.17772293090820312, -0.17108154296875, -0.16444015502929688, -0.15779876708984375, -0.15115737915039062, -0.1445159912109375, -0.13787460327148438, -0.13123321533203125, -0.12459182739257812, -0.117950439453125, -0.11130905151367188, -0.10466766357421875, -0.09802627563476562, -0.0913848876953125, -0.08474349975585938, -0.07810211181640625, -0.07146072387695312, -0.0648193359375, -0.058177947998046875, -0.05153656005859375, -0.044895172119140625, -0.0382537841796875, -0.031612396240234375, -0.02497100830078125, -0.018329620361328125, -0.011688232421875, -0.005046844482421875, 0.00159454345703125, 0.008235931396484375, 0.0148773193359375, 0.021518707275390625, 0.02816009521484375, 0.034801483154296875, 0.04144287109375, 0.048084259033203125, 0.05472564697265625, 0.061367034912109375, 0.0680084228515625, 0.07464981079101562, 0.08129119873046875, 0.08793258666992188, 0.094573974609375, 0.10121536254882812, 0.10785675048828125, 0.11449813842773438, 0.1211395263671875, 0.12778091430664062, 0.13442230224609375, 0.14106369018554688, 0.147705078125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 4.0, 19.0, 28.0, 66.0, 123.0, 191.0, 228.0, 192.0, 64.0, 41.0, 16.0, 13.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8869035243988037, -2.809570074081421, -2.732236862182617, -2.6549034118652344, -2.5775699615478516, -2.5002365112304688, -2.422903299331665, -2.3455698490142822, -2.2682366371154785, -2.1909031867980957, -2.113569974899292, -2.036236524581909, -1.9589030742645264, -1.881569743156433, -1.8042364120483398, -1.726902961730957, -1.6495695114135742, -1.572236180305481, -1.4949027299880981, -1.4175693988800049, -1.340235948562622, -1.2629026174545288, -1.1855692863464355, -1.1082358360290527, -1.0309025049209595, -0.9535691142082214, -0.8762357234954834, -0.7989023923873901, -0.7215690016746521, -0.6442356109619141, -0.5669022798538208, -0.48956888914108276, -0.41223573684692383, -0.3349023461341858, -0.25756898522377014, -0.1802356094121933, -0.10290223360061646, -0.025568842887878418, 0.05176451802253723, 0.12909787893295288, 0.20643126964569092, 0.28376466035842896, 0.3610980212688446, 0.43843138217926025, 0.5157647728919983, 0.5930981636047363, 0.6704314947128296, 0.7477648854255676, 0.8250982761383057, 0.9024316668510437, 0.9797650575637817, 1.057098388671875, 1.1344318389892578, 1.211765170097351, 1.2890985012054443, 1.3664319515228271, 1.4437652826309204, 1.5210986137390137, 1.5984320640563965, 1.6757653951644897, 1.753098726272583, 1.8304321765899658, 1.907765507698059, 1.9850988388061523, 2.062432289123535]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 9.0, 10.0, 12.0, 22.0, 30.0, 34.0, 74.0, 88.0, 97.0, 112.0, 108.0, 105.0, 88.0, 57.0, 46.0, 33.0, 16.0, 19.0, 13.0, 10.0, 3.0, 3.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9837837219238281, -1.9147576093673706, -1.845731496810913, -1.7767053842544556, -1.707679271697998, -1.63865327835083, -1.5696271657943726, -1.500601053237915, -1.4315749406814575, -1.362548828125, -1.2935227155685425, -1.224496603012085, -1.155470609664917, -1.08644437789917, -1.017418384552002, -0.9483922719955444, -0.8793661594390869, -0.8103400468826294, -0.7413139343261719, -0.6722878813743591, -0.6032617688179016, -0.5342356562614441, -0.46520957350730896, -0.39618349075317383, -0.3271573781967163, -0.2581312656402588, -0.18910518288612366, -0.12007908523082733, -0.051052987575531006, 0.017973124980926514, 0.08699920773506165, 0.15602529048919678, 0.2250516414642334, 0.2940777540206909, 0.36310383677482605, 0.4321299195289612, 0.5011560320854187, 0.5701821446418762, 0.639208197593689, 0.7082343101501465, 0.777260422706604, 0.8462865352630615, 0.915312647819519, 0.9843387007713318, 1.0533647537231445, 1.1223909854888916, 1.1914169788360596, 1.260443091392517, 1.3294692039489746, 1.3984953165054321, 1.4675214290618896, 1.5365475416183472, 1.6055736541748047, 1.6745996475219727, 1.7436257600784302, 1.8126518726348877, 1.8816779851913452, 1.9507040977478027, 2.0197300910949707, 2.0887563228607178, 2.1577823162078857, 2.226808547973633, 2.295834541320801, 2.3648605346679688, 2.433886766433716]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 5.0, 3.0, 3.0, 6.0, 4.0, 14.0, 12.0, 26.0, 21.0, 44.0, 65.0, 85.0, 119.0, 207.0, 322.0, 498.0, 862.0, 1555.0, 3022.0, 6454.0, 18310.0, 88566.0, 3756438.0, 270862.0, 30127.0, 8752.0, 3551.0, 1731.0, 923.0, 563.0, 318.0, 246.0, 153.0, 96.0, 93.0, 57.0, 49.0, 29.0, 32.0, 15.0, 8.0, 12.0, 5.0, 7.0, 6.0, 2.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0], "bins": [-0.8583984375, -0.8321456909179688, -0.8058929443359375, -0.7796401977539062, -0.753387451171875, -0.7271347045898438, -0.7008819580078125, -0.6746292114257812, -0.64837646484375, -0.6221237182617188, -0.5958709716796875, -0.5696182250976562, -0.543365478515625, -0.5171127319335938, -0.4908599853515625, -0.46460723876953125, -0.4383544921875, -0.41210174560546875, -0.3858489990234375, -0.35959625244140625, -0.333343505859375, -0.30709075927734375, -0.2808380126953125, -0.25458526611328125, -0.22833251953125, -0.20207977294921875, -0.1758270263671875, -0.14957427978515625, -0.123321533203125, -0.09706878662109375, -0.0708160400390625, -0.04456329345703125, -0.018310546875, 0.00794219970703125, 0.0341949462890625, 0.06044769287109375, 0.086700439453125, 0.11295318603515625, 0.1392059326171875, 0.16545867919921875, 0.19171142578125, 0.21796417236328125, 0.2442169189453125, 0.27046966552734375, 0.296722412109375, 0.32297515869140625, 0.3492279052734375, 0.37548065185546875, 0.4017333984375, 0.42798614501953125, 0.4542388916015625, 0.48049163818359375, 0.506744384765625, 0.5329971313476562, 0.5592498779296875, 0.5855026245117188, 0.61175537109375, 0.6380081176757812, 0.6642608642578125, 0.6905136108398438, 0.716766357421875, 0.7430191040039062, 0.7692718505859375, 0.7955245971679688, 0.82177734375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 12.0, 7.0, 12.0, 14.0, 17.0, 19.0, 34.0, 40.0, 68.0, 73.0, 91.0, 108.0, 107.0, 99.0, 76.0, 59.0, 44.0, 23.0, 17.0, 17.0, 14.0, 10.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.03656005859375, -0.03540802001953125, -0.0342559814453125, -0.03310394287109375, -0.031951904296875, -0.03079986572265625, -0.0296478271484375, -0.02849578857421875, -0.02734375, -0.02619171142578125, -0.0250396728515625, -0.02388763427734375, -0.022735595703125, -0.02158355712890625, -0.0204315185546875, -0.01927947998046875, -0.01812744140625, -0.01697540283203125, -0.0158233642578125, -0.01467132568359375, -0.013519287109375, -0.01236724853515625, -0.0112152099609375, -0.01006317138671875, -0.0089111328125, -0.00775909423828125, -0.0066070556640625, -0.00545501708984375, -0.004302978515625, -0.00315093994140625, -0.0019989013671875, -0.00084686279296875, 0.00030517578125, 0.00145721435546875, 0.0026092529296875, 0.00376129150390625, 0.004913330078125, 0.00606536865234375, 0.0072174072265625, 0.00836944580078125, 0.009521484375, 0.01067352294921875, 0.0118255615234375, 0.01297760009765625, 0.014129638671875, 0.01528167724609375, 0.0164337158203125, 0.01758575439453125, 0.01873779296875, 0.01988983154296875, 0.0210418701171875, 0.02219390869140625, 0.023345947265625, 0.02449798583984375, 0.0256500244140625, 0.02680206298828125, 0.0279541015625, 0.02910614013671875, 0.0302581787109375, 0.03141021728515625, 0.032562255859375, 0.03371429443359375, 0.0348663330078125, 0.03601837158203125, 0.03717041015625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 0.0, 4.0, 4.0, 6.0, 8.0, 5.0, 15.0, 13.0, 15.0, 19.0, 37.0, 51.0, 61.0, 167.0, 423.0, 2149.0, 63691.0, 4090029.0, 35236.0, 1679.0, 359.0, 115.0, 60.0, 36.0, 26.0, 25.0, 16.0, 13.0, 10.0, 3.0, 4.0, 5.0, 0.0, 1.0, 4.0, 2.0, 1.0], "bins": [-2.75, -2.6881103515625, -2.626220703125, -2.5643310546875, -2.50244140625, -2.4405517578125, -2.378662109375, -2.3167724609375, -2.2548828125, -2.1929931640625, -2.131103515625, -2.0692138671875, -2.00732421875, -1.9454345703125, -1.883544921875, -1.8216552734375, -1.759765625, -1.6978759765625, -1.635986328125, -1.5740966796875, -1.51220703125, -1.4503173828125, -1.388427734375, -1.3265380859375, -1.2646484375, -1.2027587890625, -1.140869140625, -1.0789794921875, -1.01708984375, -0.9552001953125, -0.893310546875, -0.8314208984375, -0.76953125, -0.7076416015625, -0.645751953125, -0.5838623046875, -0.52197265625, -0.4600830078125, -0.398193359375, -0.3363037109375, -0.2744140625, -0.2125244140625, -0.150634765625, -0.0887451171875, -0.02685546875, 0.0350341796875, 0.096923828125, 0.1588134765625, 0.220703125, 0.2825927734375, 0.344482421875, 0.4063720703125, 0.46826171875, 0.5301513671875, 0.592041015625, 0.6539306640625, 0.7158203125, 0.7777099609375, 0.839599609375, 0.9014892578125, 0.96337890625, 1.0252685546875, 1.087158203125, 1.1490478515625, 1.2109375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 6.0, 7.0, 12.0, 8.0, 10.0, 14.0, 24.0, 31.0, 47.0, 86.0, 153.0, 324.0, 894.0, 1441.0, 435.0, 208.0, 125.0, 74.0, 56.0, 34.0, 22.0, 16.0, 10.0, 12.0, 8.0, 5.0, 3.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.10888671875, -0.10595989227294922, -0.10303306579589844, -0.10010623931884766, -0.09717941284179688, -0.0942525863647461, -0.09132575988769531, -0.08839893341064453, -0.08547210693359375, -0.08254528045654297, -0.07961845397949219, -0.0766916275024414, -0.07376480102539062, -0.07083797454833984, -0.06791114807128906, -0.06498432159423828, -0.0620574951171875, -0.05913066864013672, -0.05620384216308594, -0.053277015686035156, -0.050350189208984375, -0.047423362731933594, -0.04449653625488281, -0.04156970977783203, -0.03864288330078125, -0.03571605682373047, -0.03278923034667969, -0.029862403869628906, -0.026935577392578125, -0.024008750915527344, -0.021081924438476562, -0.01815509796142578, -0.015228271484375, -0.012301445007324219, -0.009374618530273438, -0.006447792053222656, -0.003520965576171875, -0.0005941390991210938, 0.0023326873779296875, 0.005259513854980469, 0.00818634033203125, 0.011113166809082031, 0.014039993286132812, 0.016966819763183594, 0.019893646240234375, 0.022820472717285156, 0.025747299194335938, 0.02867412567138672, 0.0316009521484375, 0.03452777862548828, 0.03745460510253906, 0.040381431579589844, 0.043308258056640625, 0.046235084533691406, 0.04916191101074219, 0.05208873748779297, 0.05501556396484375, 0.05794239044189453, 0.06086921691894531, 0.0637960433959961, 0.06672286987304688, 0.06964969635009766, 0.07257652282714844, 0.07550334930419922, 0.07843017578125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 12.0, 448.0, 491.0, 48.0, 10.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.537416458129883, -6.409108638763428, -6.280800819396973, -6.152493476867676, -6.024185657501221, -5.895877838134766, -5.7675700187683105, -5.6392621994018555, -5.510954856872559, -5.3826470375061035, -5.254339218139648, -5.126031875610352, -4.9977240562438965, -4.869416236877441, -4.741108417510986, -4.612800598144531, -4.484493255615234, -4.356185436248779, -4.227877616882324, -4.099570274353027, -3.9712624549865723, -3.842954635620117, -3.714646816253662, -3.586339235305786, -3.458031177520752, -3.329723358154297, -3.201415777206421, -3.073107957839966, -2.94480037689209, -2.8164925575256348, -2.6881847381591797, -2.5598771572113037, -2.431569814682007, -2.3032619953155518, -2.174954414367676, -2.0466465950012207, -1.9183390140533447, -1.7900311946868896, -1.6617234945297241, -1.5334157943725586, -1.405108094215393, -1.2768003940582275, -1.148492693901062, -1.0201849937438965, -0.8918772339820862, -0.7635695338249207, -0.6352617740631104, -0.5069540739059448, -0.3786463737487793, -0.25033867359161377, -0.12203094363212585, 0.0062767863273620605, 0.1345844864845276, 0.2628921866416931, 0.3911999464035034, 0.519507646560669, 0.6478153467178345, 0.776123046875, 0.9044307470321655, 1.032738447189331, 1.1610462665557861, 1.289353847503662, 1.4176616668701172, 1.5459693670272827, 1.6742770671844482]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 10.0, 13.0, 28.0, 57.0, 97.0, 147.0, 164.0, 200.0, 129.0, 82.0, 39.0, 25.0, 13.0, 6.0, 2.0, 0.0, 1.0], "bins": [-2.273683547973633, -2.23122501373291, -2.1887664794921875, -2.146307945251465, -2.103849411010742, -2.0613908767700195, -2.018932342529297, -1.9764736890792847, -1.934015154838562, -1.8915566205978394, -1.8490980863571167, -1.8066394329071045, -1.7641808986663818, -1.7217223644256592, -1.6792638301849365, -1.6368052959442139, -1.5943467617034912, -1.5518882274627686, -1.509429693222046, -1.4669711589813232, -1.424512505531311, -1.3820539712905884, -1.3395954370498657, -1.297136902809143, -1.2546782493591309, -1.2122197151184082, -1.1697611808776855, -1.127302646636963, -1.0848439931869507, -1.042385458946228, -0.9999269247055054, -0.9574683904647827, -0.9150099158287048, -0.8725513815879822, -0.8300927877426147, -0.7876342535018921, -0.7451757192611694, -0.7027171850204468, -0.6602585911750793, -0.6178000569343567, -0.5753414630889893, -0.5328829288482666, -0.49042436480522156, -0.4479658007621765, -0.40550726652145386, -0.3630487024784088, -0.32059013843536377, -0.2781316041946411, -0.23567306995391846, -0.1932145208120346, -0.15075597167015076, -0.10829740762710571, -0.06583885848522186, -0.023380309343338013, 0.01907825469970703, 0.06153678894042969, 0.10399535298347473, 0.14645390212535858, 0.18891245126724243, 0.23137101531028748, 0.2738295793533325, 0.3162881135940552, 0.3587466776371002, 0.4012052118778229, 0.4436637759208679]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 8.0, 7.0, 12.0, 12.0, 14.0, 22.0, 24.0, 31.0, 34.0, 54.0, 59.0, 67.0, 65.0, 470.0, 1046640.0, 642.0, 70.0, 61.0, 74.0, 44.0, 39.0, 25.0, 24.0, 22.0, 7.0, 9.0, 9.0, 7.0, 5.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.49609375, -5.32708740234375, -5.1580810546875, -4.98907470703125, -4.820068359375, -4.65106201171875, -4.4820556640625, -4.31304931640625, -4.14404296875, -3.97503662109375, -3.8060302734375, -3.63702392578125, -3.468017578125, -3.29901123046875, -3.1300048828125, -2.96099853515625, -2.7919921875, -2.62298583984375, -2.4539794921875, -2.28497314453125, -2.115966796875, -1.94696044921875, -1.7779541015625, -1.60894775390625, -1.43994140625, -1.27093505859375, -1.1019287109375, -0.93292236328125, -0.763916015625, -0.59490966796875, -0.4259033203125, -0.25689697265625, -0.087890625, 0.08111572265625, 0.2501220703125, 0.41912841796875, 0.588134765625, 0.75714111328125, 0.9261474609375, 1.09515380859375, 1.26416015625, 1.43316650390625, 1.6021728515625, 1.77117919921875, 1.940185546875, 2.10919189453125, 2.2781982421875, 2.44720458984375, 2.6162109375, 2.78521728515625, 2.9542236328125, 3.12322998046875, 3.292236328125, 3.46124267578125, 3.6302490234375, 3.79925537109375, 3.96826171875, 4.13726806640625, 4.3062744140625, 4.47528076171875, 4.644287109375, 4.81329345703125, 4.9822998046875, 5.15130615234375, 5.3203125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 57.0, 456.0, 455.0, 44.0, 4.0], "bins": [-0.68115234375, -0.6699714660644531, -0.6587905883789062, -0.6476097106933594, -0.6364288330078125, -0.6252479553222656, -0.6140670776367188, -0.6028861999511719, -0.591705322265625, -0.5805244445800781, -0.5693435668945312, -0.5581626892089844, -0.5469818115234375, -0.5358009338378906, -0.5246200561523438, -0.5134391784667969, -0.50225830078125, -0.4910774230957031, -0.47989654541015625, -0.4687156677246094, -0.4575347900390625, -0.4463539123535156, -0.43517303466796875, -0.4239921569824219, -0.412811279296875, -0.4016304016113281, -0.39044952392578125, -0.3792686462402344, -0.3680877685546875, -0.3569068908691406, -0.34572601318359375, -0.3345451354980469, -0.3233642578125, -0.3121833801269531, -0.30100250244140625, -0.2898216247558594, -0.2786407470703125, -0.2674598693847656, -0.25627899169921875, -0.24509811401367188, -0.233917236328125, -0.22273635864257812, -0.21155548095703125, -0.20037460327148438, -0.1891937255859375, -0.17801284790039062, -0.16683197021484375, -0.15565109252929688, -0.14447021484375, -0.13328933715820312, -0.12210845947265625, -0.11092758178710938, -0.0997467041015625, -0.08856582641601562, -0.07738494873046875, -0.06620407104492188, -0.055023193359375, -0.043842315673828125, -0.03266143798828125, -0.021480560302734375, -0.0102996826171875, 0.000881195068359375, 0.01206207275390625, 0.023242950439453125, 0.034423828125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 2.0, 13.0, 4.0, 14.0, 25.0, 24.0, 46.0, 51.0, 77.0, 143.0, 197.0, 331.0, 662.0, 1101.0, 2270.0, 4693.0, 10303.0, 25063.0, 72108.0, 256047.0, 447173.0, 150484.0, 46040.0, 17531.0, 7076.0, 3351.0, 1639.0, 875.0, 445.0, 267.0, 178.0, 106.0, 69.0, 38.0, 40.0, 16.0, 12.0, 14.0, 6.0, 10.0, 5.0, 5.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.5947265625, -0.5768661499023438, -0.5590057373046875, -0.5411453247070312, -0.523284912109375, -0.5054244995117188, -0.4875640869140625, -0.46970367431640625, -0.45184326171875, -0.43398284912109375, -0.4161224365234375, -0.39826202392578125, -0.380401611328125, -0.36254119873046875, -0.3446807861328125, -0.32682037353515625, -0.3089599609375, -0.29109954833984375, -0.2732391357421875, -0.25537872314453125, -0.237518310546875, -0.21965789794921875, -0.2017974853515625, -0.18393707275390625, -0.16607666015625, -0.14821624755859375, -0.1303558349609375, -0.11249542236328125, -0.094635009765625, -0.07677459716796875, -0.0589141845703125, -0.04105377197265625, -0.023193359375, -0.00533294677734375, 0.0125274658203125, 0.03038787841796875, 0.048248291015625, 0.06610870361328125, 0.0839691162109375, 0.10182952880859375, 0.11968994140625, 0.13755035400390625, 0.1554107666015625, 0.17327117919921875, 0.191131591796875, 0.20899200439453125, 0.2268524169921875, 0.24471282958984375, 0.2625732421875, 0.28043365478515625, 0.2982940673828125, 0.31615447998046875, 0.334014892578125, 0.35187530517578125, 0.3697357177734375, 0.38759613037109375, 0.40545654296875, 0.42331695556640625, 0.4411773681640625, 0.45903778076171875, 0.476898193359375, 0.49475860595703125, 0.5126190185546875, 0.5304794311523438, 0.54833984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 5.0, 9.0, 3.0, 12.0, 13.0, 9.0, 21.0, 20.0, 29.0, 49.0, 33.0, 64.0, 44.0, 59.0, 76.0, 54.0, 53.0, 68.0, 56.0, 61.0, 62.0, 33.0, 32.0, 27.0, 29.0, 25.0, 12.0, 11.0, 8.0, 2.0, 3.0, 9.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50927734375, -0.4922332763671875, -0.475189208984375, -0.4581451416015625, -0.44110107421875, -0.4240570068359375, -0.407012939453125, -0.3899688720703125, -0.3729248046875, -0.3558807373046875, -0.338836669921875, -0.3217926025390625, -0.30474853515625, -0.2877044677734375, -0.270660400390625, -0.2536163330078125, -0.236572265625, -0.2195281982421875, -0.202484130859375, -0.1854400634765625, -0.16839599609375, -0.1513519287109375, -0.134307861328125, -0.1172637939453125, -0.1002197265625, -0.0831756591796875, -0.066131591796875, -0.0490875244140625, -0.03204345703125, -0.0149993896484375, 0.002044677734375, 0.0190887451171875, 0.0361328125, 0.0531768798828125, 0.070220947265625, 0.0872650146484375, 0.10430908203125, 0.1213531494140625, 0.138397216796875, 0.1554412841796875, 0.1724853515625, 0.1895294189453125, 0.206573486328125, 0.2236175537109375, 0.24066162109375, 0.2577056884765625, 0.274749755859375, 0.2917938232421875, 0.308837890625, 0.3258819580078125, 0.342926025390625, 0.3599700927734375, 0.37701416015625, 0.3940582275390625, 0.411102294921875, 0.4281463623046875, 0.4451904296875, 0.4622344970703125, 0.479278564453125, 0.4963226318359375, 0.51336669921875, 0.5304107666015625, 0.547454833984375, 0.5644989013671875, 0.58154296875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 0.0, 5.0, 5.0, 4.0, 7.0, 14.0, 11.0, 24.0, 41.0, 55.0, 99.0, 180.0, 341.0, 644.0, 1452.0, 3912.0, 15276.0, 114788.0, 758136.0, 129930.0, 16549.0, 4178.0, 1495.0, 646.0, 310.0, 188.0, 86.0, 61.0, 39.0, 15.0, 18.0, 8.0, 8.0, 4.0, 5.0, 5.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98583984375, -0.9555282592773438, -0.9252166748046875, -0.8949050903320312, -0.864593505859375, -0.8342819213867188, -0.8039703369140625, -0.7736587524414062, -0.74334716796875, -0.7130355834960938, -0.6827239990234375, -0.6524124145507812, -0.622100830078125, -0.5917892456054688, -0.5614776611328125, -0.5311660766601562, -0.5008544921875, -0.47054290771484375, -0.4402313232421875, -0.40991973876953125, -0.379608154296875, -0.34929656982421875, -0.3189849853515625, -0.28867340087890625, -0.25836181640625, -0.22805023193359375, -0.1977386474609375, -0.16742706298828125, -0.137115478515625, -0.10680389404296875, -0.0764923095703125, -0.04618072509765625, -0.015869140625, 0.01444244384765625, 0.0447540283203125, 0.07506561279296875, 0.105377197265625, 0.13568878173828125, 0.1660003662109375, 0.19631195068359375, 0.22662353515625, 0.25693511962890625, 0.2872467041015625, 0.31755828857421875, 0.347869873046875, 0.37818145751953125, 0.4084930419921875, 0.43880462646484375, 0.4691162109375, 0.49942779541015625, 0.5297393798828125, 0.5600509643554688, 0.590362548828125, 0.6206741333007812, 0.6509857177734375, 0.6812973022460938, 0.71160888671875, 0.7419204711914062, 0.7722320556640625, 0.8025436401367188, 0.832855224609375, 0.8631668090820312, 0.8934783935546875, 0.9237899780273438, 0.9541015625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 9.0, 12.0, 17.0, 31.0, 39.0, 68.0, 122.0, 146.0, 161.0, 140.0, 86.0, 54.0, 31.0, 20.0, 16.0, 15.0, 8.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012624263763427734, -0.00012233667075634003, -0.00011843070387840271, -0.00011452473700046539, -0.00011061877012252808, -0.00010671280324459076, -0.00010280683636665344, -9.890086948871613e-05, -9.499490261077881e-05, -9.108893573284149e-05, -8.718296885490417e-05, -8.327700197696686e-05, -7.937103509902954e-05, -7.546506822109222e-05, -7.155910134315491e-05, -6.765313446521759e-05, -6.374716758728027e-05, -5.9841200709342957e-05, -5.593523383140564e-05, -5.202926695346832e-05, -4.8123300075531006e-05, -4.421733319759369e-05, -4.031136631965637e-05, -3.6405399441719055e-05, -3.249943256378174e-05, -2.859346568584442e-05, -2.4687498807907104e-05, -2.0781531929969788e-05, -1.687556505203247e-05, -1.2969598174095154e-05, -9.063631296157837e-06, -5.15766441822052e-06, -1.2516975402832031e-06, 2.6542693376541138e-06, 6.560236215591431e-06, 1.0466203093528748e-05, 1.4372169971466064e-05, 1.827813684940338e-05, 2.2184103727340698e-05, 2.6090070605278015e-05, 2.9996037483215332e-05, 3.390200436115265e-05, 3.7807971239089966e-05, 4.171393811702728e-05, 4.56199049949646e-05, 4.9525871872901917e-05, 5.3431838750839233e-05, 5.733780562877655e-05, 6.124377250671387e-05, 6.514973938465118e-05, 6.90557062625885e-05, 7.296167314052582e-05, 7.686764001846313e-05, 8.077360689640045e-05, 8.467957377433777e-05, 8.858554065227509e-05, 9.24915075302124e-05, 9.639747440814972e-05, 0.00010030344128608704, 0.00010420940816402435, 0.00010811537504196167, 0.00011202134191989899, 0.0001159273087978363, 0.00011983327567577362, 0.00012373924255371094]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 4.0, 6.0, 3.0, 6.0, 9.0, 16.0, 19.0, 30.0, 45.0, 59.0, 80.0, 129.0, 272.0, 434.0, 756.0, 1369.0, 2624.0, 5972.0, 17426.0, 94020.0, 726696.0, 161908.0, 22704.0, 7144.0, 3130.0, 1513.0, 887.0, 506.0, 301.0, 178.0, 105.0, 58.0, 56.0, 31.0, 19.0, 9.0, 14.0, 6.0, 9.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0458984375, -1.013824462890625, -0.98175048828125, -0.949676513671875, -0.9176025390625, -0.885528564453125, -0.85345458984375, -0.821380615234375, -0.789306640625, -0.757232666015625, -0.72515869140625, -0.693084716796875, -0.6610107421875, -0.628936767578125, -0.59686279296875, -0.564788818359375, -0.53271484375, -0.500640869140625, -0.46856689453125, -0.436492919921875, -0.4044189453125, -0.372344970703125, -0.34027099609375, -0.308197021484375, -0.276123046875, -0.244049072265625, -0.21197509765625, -0.179901123046875, -0.1478271484375, -0.115753173828125, -0.08367919921875, -0.051605224609375, -0.01953125, 0.012542724609375, 0.04461669921875, 0.076690673828125, 0.1087646484375, 0.140838623046875, 0.17291259765625, 0.204986572265625, 0.237060546875, 0.269134521484375, 0.30120849609375, 0.333282470703125, 0.3653564453125, 0.397430419921875, 0.42950439453125, 0.461578369140625, 0.49365234375, 0.525726318359375, 0.55780029296875, 0.589874267578125, 0.6219482421875, 0.654022216796875, 0.68609619140625, 0.718170166015625, 0.750244140625, 0.782318115234375, 0.81439208984375, 0.846466064453125, 0.8785400390625, 0.910614013671875, 0.94268798828125, 0.974761962890625, 1.0068359375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 7.0, 3.0, 5.0, 4.0, 2.0, 12.0, 18.0, 14.0, 26.0, 38.0, 55.0, 87.0, 152.0, 139.0, 130.0, 91.0, 80.0, 51.0, 31.0, 18.0, 13.0, 6.0, 2.0, 8.0, 2.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.38623046875, -0.37176513671875, -0.3572998046875, -0.34283447265625, -0.328369140625, -0.31390380859375, -0.2994384765625, -0.28497314453125, -0.2705078125, -0.25604248046875, -0.2415771484375, -0.22711181640625, -0.212646484375, -0.19818115234375, -0.1837158203125, -0.16925048828125, -0.15478515625, -0.14031982421875, -0.1258544921875, -0.11138916015625, -0.096923828125, -0.08245849609375, -0.0679931640625, -0.05352783203125, -0.0390625, -0.02459716796875, -0.0101318359375, 0.00433349609375, 0.018798828125, 0.03326416015625, 0.0477294921875, 0.06219482421875, 0.07666015625, 0.09112548828125, 0.1055908203125, 0.12005615234375, 0.134521484375, 0.14898681640625, 0.1634521484375, 0.17791748046875, 0.1923828125, 0.20684814453125, 0.2213134765625, 0.23577880859375, 0.250244140625, 0.26470947265625, 0.2791748046875, 0.29364013671875, 0.30810546875, 0.32257080078125, 0.3370361328125, 0.35150146484375, 0.365966796875, 0.38043212890625, 0.3948974609375, 0.40936279296875, 0.423828125, 0.43829345703125, 0.4527587890625, 0.46722412109375, 0.481689453125, 0.49615478515625, 0.5106201171875, 0.52508544921875, 0.53955078125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 15.0, 160.0, 516.0, 233.0, 61.0, 14.0, 5.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.258275985717773, -23.786636352539062, -23.31499671936035, -22.84335708618164, -22.371719360351562, -21.90007972717285, -21.42844009399414, -20.95680046081543, -20.48516082763672, -20.013521194458008, -19.541881561279297, -19.070241928100586, -18.598604202270508, -18.126964569091797, -17.655324935913086, -17.183685302734375, -16.712045669555664, -16.240406036376953, -15.768767356872559, -15.297127723693848, -14.825488090515137, -14.353849411010742, -13.882209777832031, -13.41057014465332, -12.938931465148926, -12.467291831970215, -11.99565315246582, -11.52401351928711, -11.052373886108398, -10.580734252929688, -10.109095573425293, -9.637455940246582, -9.165816307067871, -8.69417667388916, -8.222537994384766, -7.750898361206055, -7.279258728027344, -6.807619571685791, -6.335980415344238, -5.864340782165527, -5.392701148986816, -4.921061992645264, -4.449422359466553, -3.977783203125, -3.506143569946289, -3.0345044136047363, -2.5628650188446045, -2.0912256240844727, -1.61958646774292, -1.147947072982788, -0.676307737827301, -0.20466840267181396, 0.26697099208831787, 0.7386102676391602, 1.210249662399292, 1.6818890571594238, 2.1535284519195557, 2.6251678466796875, 3.0968072414398193, 3.568446636199951, 4.040085792541504, 4.511725425720215, 4.983364582061768, 5.45500373840332, 5.926643371582031]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 13.0, 17.0, 16.0, 25.0, 29.0, 34.0, 49.0, 48.0, 47.0, 62.0, 56.0, 67.0, 73.0, 67.0, 64.0, 64.0, 55.0, 54.0, 37.0, 29.0, 26.0, 15.0, 14.0, 12.0, 11.0, 9.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.207541465759277, -5.082756042480469, -4.95797061920166, -4.833185195922852, -4.708399295806885, -4.583613872528076, -4.458828449249268, -4.334043025970459, -4.20925760269165, -4.084472179412842, -3.959686517715454, -3.8349010944366455, -3.710115671157837, -3.585330009460449, -3.4605445861816406, -3.335759162902832, -3.2109732627868652, -3.0861878395080566, -2.961402177810669, -2.8366167545318604, -2.7118313312530518, -2.587045669555664, -2.4622602462768555, -2.337474822998047, -2.2126893997192383, -2.0879039764404297, -1.9631184339523315, -1.8383328914642334, -1.7135473489761353, -1.588761806488037, -1.4639763832092285, -1.3391908407211304, -1.2144052982330322, -1.089619755744934, -0.9648342728614807, -0.8400487899780273, -0.7152632474899292, -0.5904777646064758, -0.46569228172302246, -0.3409067392349243, -0.21612125635147095, -0.09133575111627579, 0.03344975411891937, 0.15823525190353394, 0.2830207645893097, 0.40780627727508545, 0.5325917601585388, 0.657377302646637, 0.7821627855300903, 0.9069482684135437, 1.031733751296997, 1.1565192937850952, 1.2813048362731934, 1.406090259552002, 1.5308758020401, 1.6556613445281982, 1.7804467678070068, 1.905232310295105, 2.030017852783203, 2.1548032760620117, 2.2795886993408203, 2.404374361038208, 2.5291597843170166, 2.6539454460144043, 2.778730869293213]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 13.0, 16.0, 26.0, 30.0, 51.0, 49.0, 65.0, 124.0, 168.0, 392.0, 34834.0, 4158048.0, 359.0, 81.0, 19.0, 8.0, 1.0, 2.0], "bins": [-24.578125, -24.148162841796875, -23.71820068359375, -23.288238525390625, -22.8582763671875, -22.428314208984375, -21.99835205078125, -21.568389892578125, -21.138427734375, -20.708465576171875, -20.27850341796875, -19.848541259765625, -19.4185791015625, -18.988616943359375, -18.55865478515625, -18.128692626953125, -17.69873046875, -17.268768310546875, -16.83880615234375, -16.408843994140625, -15.9788818359375, -15.548919677734375, -15.11895751953125, -14.688995361328125, -14.259033203125, -13.829071044921875, -13.39910888671875, -12.969146728515625, -12.5391845703125, -12.109222412109375, -11.67926025390625, -11.249298095703125, -10.8193359375, -10.389373779296875, -9.95941162109375, -9.529449462890625, -9.0994873046875, -8.669525146484375, -8.23956298828125, -7.809600830078125, -7.379638671875, -6.949676513671875, -6.51971435546875, -6.089752197265625, -5.6597900390625, -5.229827880859375, -4.79986572265625, -4.369903564453125, -3.93994140625, -3.509979248046875, -3.08001708984375, -2.650054931640625, -2.2200927734375, -1.790130615234375, -1.36016845703125, -0.930206298828125, -0.500244140625, -0.070281982421875, 0.35968017578125, 0.789642333984375, 1.2196044921875, 1.649566650390625, 2.07952880859375, 2.509490966796875, 2.939453125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 12.0, 25.0, 90.0, 245.0, 336.0, 215.0, 77.0, 15.0, 2.0, 1.0, 1.0], "bins": [-0.7265625, -0.7138843536376953, -0.7012062072753906, -0.6885280609130859, -0.6758499145507812, -0.6631717681884766, -0.6504936218261719, -0.6378154754638672, -0.6251373291015625, -0.6124591827392578, -0.5997810363769531, -0.5871028900146484, -0.5744247436523438, -0.5617465972900391, -0.5490684509277344, -0.5363903045654297, -0.523712158203125, -0.5110340118408203, -0.4983558654785156, -0.48567771911621094, -0.47299957275390625, -0.46032142639160156, -0.4476432800292969, -0.4349651336669922, -0.4222869873046875, -0.4096088409423828, -0.3969306945800781, -0.38425254821777344, -0.37157440185546875, -0.35889625549316406, -0.3462181091308594, -0.3335399627685547, -0.32086181640625, -0.3081836700439453, -0.2955055236816406, -0.28282737731933594, -0.27014923095703125, -0.25747108459472656, -0.24479293823242188, -0.2321147918701172, -0.2194366455078125, -0.2067584991455078, -0.19408035278320312, -0.18140220642089844, -0.16872406005859375, -0.15604591369628906, -0.14336776733398438, -0.1306896209716797, -0.118011474609375, -0.10533332824707031, -0.09265518188476562, -0.07997703552246094, -0.06729888916015625, -0.05462074279785156, -0.041942596435546875, -0.029264450073242188, -0.0165863037109375, -0.0039081573486328125, 0.008769989013671875, 0.021448135375976562, 0.03412628173828125, 0.04680442810058594, 0.059482574462890625, 0.07216072082519531, 0.0848388671875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 7.0, 4.0, 11.0, 12.0, 18.0, 34.0, 25.0, 26.0, 21.0, 35.0, 49.0, 88.0, 109.0, 136.0, 277.0, 773.0, 9574.0, 4162153.0, 19032.0, 1057.0, 329.0, 157.0, 99.0, 56.0, 36.0, 36.0, 24.0, 22.0, 11.0, 15.0, 12.0, 6.0, 6.0, 4.0, 7.0, 6.0, 0.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.9375, -9.62255859375, -9.3076171875, -8.99267578125, -8.677734375, -8.36279296875, -8.0478515625, -7.73291015625, -7.41796875, -7.10302734375, -6.7880859375, -6.47314453125, -6.158203125, -5.84326171875, -5.5283203125, -5.21337890625, -4.8984375, -4.58349609375, -4.2685546875, -3.95361328125, -3.638671875, -3.32373046875, -3.0087890625, -2.69384765625, -2.37890625, -2.06396484375, -1.7490234375, -1.43408203125, -1.119140625, -0.80419921875, -0.4892578125, -0.17431640625, 0.140625, 0.45556640625, 0.7705078125, 1.08544921875, 1.400390625, 1.71533203125, 2.0302734375, 2.34521484375, 2.66015625, 2.97509765625, 3.2900390625, 3.60498046875, 3.919921875, 4.23486328125, 4.5498046875, 4.86474609375, 5.1796875, 5.49462890625, 5.8095703125, 6.12451171875, 6.439453125, 6.75439453125, 7.0693359375, 7.38427734375, 7.69921875, 8.01416015625, 8.3291015625, 8.64404296875, 8.958984375, 9.27392578125, 9.5888671875, 9.90380859375, 10.21875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 6.0, 27.0, 213.0, 3467.0, 255.0, 72.0, 30.0, 9.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.001953125, -1.9548797607421875, -1.907806396484375, -1.8607330322265625, -1.81365966796875, -1.7665863037109375, -1.719512939453125, -1.6724395751953125, -1.6253662109375, -1.5782928466796875, -1.531219482421875, -1.4841461181640625, -1.43707275390625, -1.3899993896484375, -1.342926025390625, -1.2958526611328125, -1.248779296875, -1.2017059326171875, -1.154632568359375, -1.1075592041015625, -1.06048583984375, -1.0134124755859375, -0.966339111328125, -0.9192657470703125, -0.8721923828125, -0.8251190185546875, -0.778045654296875, -0.7309722900390625, -0.68389892578125, -0.6368255615234375, -0.589752197265625, -0.5426788330078125, -0.49560546875, -0.4485321044921875, -0.401458740234375, -0.3543853759765625, -0.30731201171875, -0.2602386474609375, -0.213165283203125, -0.1660919189453125, -0.1190185546875, -0.0719451904296875, -0.024871826171875, 0.0222015380859375, 0.06927490234375, 0.1163482666015625, 0.163421630859375, 0.2104949951171875, 0.257568359375, 0.3046417236328125, 0.351715087890625, 0.3987884521484375, 0.44586181640625, 0.4929351806640625, 0.540008544921875, 0.5870819091796875, 0.6341552734375, 0.6812286376953125, 0.728302001953125, 0.7753753662109375, 0.82244873046875, 0.8695220947265625, 0.916595458984375, 0.9636688232421875, 1.0107421875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 20.0, 81.0, 428.0, 357.0, 82.0, 22.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.158428192138672, -22.72878074645996, -22.29913330078125, -21.86948585510254, -21.439838409423828, -21.01019287109375, -20.58054542541504, -20.150897979736328, -19.721250534057617, -19.291603088378906, -18.861955642700195, -18.432308197021484, -18.002662658691406, -17.573015213012695, -17.143367767333984, -16.713720321655273, -16.284072875976562, -15.854425430297852, -15.42477798461914, -14.995131492614746, -14.565484046936035, -14.135836601257324, -13.70619010925293, -13.276542663574219, -12.846895217895508, -12.417247772216797, -11.987600326538086, -11.557953834533691, -11.12830638885498, -10.69865894317627, -10.269012451171875, -9.839365005493164, -9.409717559814453, -8.980070114135742, -8.550422668457031, -8.120776176452637, -7.691128730773926, -7.261481285095215, -6.831834316253662, -6.402187347412109, -5.972540378570557, -5.542893409729004, -5.113245964050293, -4.683598518371582, -4.253951549530029, -3.8243043422698975, -3.3946571350097656, -2.965009927749634, -2.535362720489502, -2.10571551322937, -1.6760683059692383, -1.2464210987091064, -0.8167738914489746, -0.3871266841888428, 0.04252052307128906, 0.4721677303314209, 0.9018149375915527, 1.3314621448516846, 1.7611093521118164, 2.1907565593719482, 2.62040376663208, 3.050050973892212, 3.4796981811523438, 3.9093453884124756, 4.338992595672607]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 8.0, 14.0, 19.0, 36.0, 60.0, 102.0, 112.0, 139.0, 133.0, 114.0, 104.0, 62.0, 46.0, 25.0, 20.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.29947566986084, -5.107267379760742, -4.915058612823486, -4.722850322723389, -4.530641555786133, -4.338433265686035, -4.1462249755859375, -3.9540164470672607, -3.761807918548584, -3.5695993900299072, -3.3773908615112305, -3.185182571411133, -2.992974042892456, -2.8007655143737793, -2.6085572242736816, -2.416348695755005, -2.224140167236328, -2.0319316387176514, -1.8397232294082642, -1.647514820098877, -1.4553062915802002, -1.2630977630615234, -1.0708893537521362, -0.878680944442749, -0.6864724159240723, -0.4942639470100403, -0.3020554780960083, -0.10984700918197632, 0.08236145973205566, 0.27456992864608765, 0.46677839756011963, 0.6589868068695068, 0.8511953353881836, 1.0434038639068604, 1.2356122732162476, 1.4278206825256348, 1.6200292110443115, 1.8122377395629883, 2.004446029663086, 2.1966545581817627, 2.3888630867004395, 2.581071615219116, 2.773280143737793, 2.9654884338378906, 3.1576969623565674, 3.349905490875244, 3.542113780975342, 3.7343223094940186, 3.9265308380126953, 4.118739128112793, 4.310947895050049, 4.5031561851501465, 4.695364952087402, 4.8875732421875, 5.079781532287598, 5.271989822387695, 5.464198589324951, 5.656406879425049, 5.848615646362305, 6.040823936462402, 6.2330322265625, 6.425240993499756, 6.6174492835998535, 6.809658050537109, 7.001866340637207]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 4.0, 3.0, 5.0, 15.0, 13.0, 14.0, 16.0, 22.0, 18.0, 30.0, 54.0, 66.0, 131.0, 271.0, 602.0, 1773.0, 10619.0, 213442.0, 786087.0, 30143.0, 3431.0, 910.0, 376.0, 177.0, 84.0, 66.0, 42.0, 18.0, 22.0, 28.0, 14.0, 10.0, 9.0, 6.0, 8.0, 1.0, 5.0, 3.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.125, -4.004425048828125, -3.88385009765625, -3.763275146484375, -3.6427001953125, -3.522125244140625, -3.40155029296875, -3.280975341796875, -3.160400390625, -3.039825439453125, -2.91925048828125, -2.798675537109375, -2.6781005859375, -2.557525634765625, -2.43695068359375, -2.316375732421875, -2.19580078125, -2.075225830078125, -1.95465087890625, -1.834075927734375, -1.7135009765625, -1.592926025390625, -1.47235107421875, -1.351776123046875, -1.231201171875, -1.110626220703125, -0.99005126953125, -0.869476318359375, -0.7489013671875, -0.628326416015625, -0.50775146484375, -0.387176513671875, -0.2666015625, -0.146026611328125, -0.02545166015625, 0.095123291015625, 0.2156982421875, 0.336273193359375, 0.45684814453125, 0.577423095703125, 0.697998046875, 0.818572998046875, 0.93914794921875, 1.059722900390625, 1.1802978515625, 1.300872802734375, 1.42144775390625, 1.542022705078125, 1.66259765625, 1.783172607421875, 1.90374755859375, 2.024322509765625, 2.1448974609375, 2.265472412109375, 2.38604736328125, 2.506622314453125, 2.627197265625, 2.747772216796875, 2.86834716796875, 2.988922119140625, 3.1094970703125, 3.230072021484375, 3.35064697265625, 3.471221923828125, 3.591796875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 6.0, 8.0, 16.0, 46.0, 108.0, 155.0, 216.0, 204.0, 123.0, 70.0, 36.0, 14.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.83837890625, -0.8215122222900391, -0.8046455383300781, -0.7877788543701172, -0.7709121704101562, -0.7540454864501953, -0.7371788024902344, -0.7203121185302734, -0.7034454345703125, -0.6865787506103516, -0.6697120666503906, -0.6528453826904297, -0.6359786987304688, -0.6191120147705078, -0.6022453308105469, -0.5853786468505859, -0.568511962890625, -0.5516452789306641, -0.5347785949707031, -0.5179119110107422, -0.5010452270507812, -0.4841785430908203, -0.4673118591308594, -0.45044517517089844, -0.4335784912109375, -0.41671180725097656, -0.3998451232910156, -0.3829784393310547, -0.36611175537109375, -0.3492450714111328, -0.3323783874511719, -0.31551170349121094, -0.29864501953125, -0.28177833557128906, -0.2649116516113281, -0.2480449676513672, -0.23117828369140625, -0.2143115997314453, -0.19744491577148438, -0.18057823181152344, -0.1637115478515625, -0.14684486389160156, -0.12997817993164062, -0.11311149597167969, -0.09624481201171875, -0.07937812805175781, -0.06251144409179688, -0.04564476013183594, -0.028778076171875, -0.011911392211914062, 0.004955291748046875, 0.021821975708007812, 0.03868865966796875, 0.05555534362792969, 0.07242202758789062, 0.08928871154785156, 0.1061553955078125, 0.12302207946777344, 0.13988876342773438, 0.1567554473876953, 0.17362213134765625, 0.1904888153076172, 0.20735549926757812, 0.22422218322753906, 0.2410888671875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 4.0, 7.0, 6.0, 9.0, 14.0, 16.0, 33.0, 32.0, 60.0, 100.0, 172.0, 251.0, 485.0, 1140.0, 2706.0, 8327.0, 31301.0, 178281.0, 630747.0, 155328.0, 27435.0, 7464.0, 2424.0, 1008.0, 497.0, 275.0, 151.0, 105.0, 53.0, 44.0, 23.0, 19.0, 17.0, 8.0, 9.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3388671875, -1.2963104248046875, -1.253753662109375, -1.2111968994140625, -1.16864013671875, -1.1260833740234375, -1.083526611328125, -1.0409698486328125, -0.9984130859375, -0.9558563232421875, -0.913299560546875, -0.8707427978515625, -0.82818603515625, -0.7856292724609375, -0.743072509765625, -0.7005157470703125, -0.657958984375, -0.6154022216796875, -0.572845458984375, -0.5302886962890625, -0.48773193359375, -0.4451751708984375, -0.402618408203125, -0.3600616455078125, -0.3175048828125, -0.2749481201171875, -0.232391357421875, -0.1898345947265625, -0.14727783203125, -0.1047210693359375, -0.062164306640625, -0.0196075439453125, 0.02294921875, 0.0655059814453125, 0.108062744140625, 0.1506195068359375, 0.19317626953125, 0.2357330322265625, 0.278289794921875, 0.3208465576171875, 0.3634033203125, 0.4059600830078125, 0.448516845703125, 0.4910736083984375, 0.53363037109375, 0.5761871337890625, 0.618743896484375, 0.6613006591796875, 0.703857421875, 0.7464141845703125, 0.788970947265625, 0.8315277099609375, 0.87408447265625, 0.9166412353515625, 0.959197998046875, 1.0017547607421875, 1.0443115234375, 1.0868682861328125, 1.129425048828125, 1.1719818115234375, 1.21453857421875, 1.2570953369140625, 1.299652099609375, 1.3422088623046875, 1.384765625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 3.0, 7.0, 6.0, 5.0, 6.0, 10.0, 14.0, 14.0, 15.0, 16.0, 28.0, 39.0, 34.0, 45.0, 49.0, 52.0, 65.0, 72.0, 66.0, 66.0, 66.0, 70.0, 61.0, 38.0, 30.0, 25.0, 21.0, 24.0, 13.0, 6.0, 7.0, 7.0, 11.0, 4.0, 6.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.86328125, -0.8362503051757812, -0.8092193603515625, -0.7821884155273438, -0.755157470703125, -0.7281265258789062, -0.7010955810546875, -0.6740646362304688, -0.64703369140625, -0.6200027465820312, -0.5929718017578125, -0.5659408569335938, -0.538909912109375, -0.5118789672851562, -0.4848480224609375, -0.45781707763671875, -0.4307861328125, -0.40375518798828125, -0.3767242431640625, -0.34969329833984375, -0.322662353515625, -0.29563140869140625, -0.2686004638671875, -0.24156951904296875, -0.21453857421875, -0.18750762939453125, -0.1604766845703125, -0.13344573974609375, -0.106414794921875, -0.07938385009765625, -0.0523529052734375, -0.02532196044921875, 0.001708984375, 0.02873992919921875, 0.0557708740234375, 0.08280181884765625, 0.109832763671875, 0.13686370849609375, 0.1638946533203125, 0.19092559814453125, 0.21795654296875, 0.24498748779296875, 0.2720184326171875, 0.29904937744140625, 0.326080322265625, 0.35311126708984375, 0.3801422119140625, 0.40717315673828125, 0.4342041015625, 0.46123504638671875, 0.4882659912109375, 0.5152969360351562, 0.542327880859375, 0.5693588256835938, 0.5963897705078125, 0.6234207153320312, 0.65045166015625, 0.6774826049804688, 0.7045135498046875, 0.7315444946289062, 0.758575439453125, 0.7856063842773438, 0.8126373291015625, 0.8396682739257812, 0.86669921875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 0.0, 6.0, 4.0, 9.0, 5.0, 4.0, 12.0, 14.0, 24.0, 36.0, 61.0, 75.0, 132.0, 217.0, 478.0, 1234.0, 3504.0, 15711.0, 143892.0, 803007.0, 65926.0, 9822.0, 2598.0, 878.0, 410.0, 190.0, 105.0, 69.0, 39.0, 30.0, 21.0, 14.0, 12.0, 7.0, 4.0, 3.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.099609375, -2.0418548583984375, -1.984100341796875, -1.9263458251953125, -1.86859130859375, -1.8108367919921875, -1.753082275390625, -1.6953277587890625, -1.6375732421875, -1.5798187255859375, -1.522064208984375, -1.4643096923828125, -1.40655517578125, -1.3488006591796875, -1.291046142578125, -1.2332916259765625, -1.175537109375, -1.1177825927734375, -1.060028076171875, -1.0022735595703125, -0.94451904296875, -0.8867645263671875, -0.829010009765625, -0.7712554931640625, -0.7135009765625, -0.6557464599609375, -0.597991943359375, -0.5402374267578125, -0.48248291015625, -0.4247283935546875, -0.366973876953125, -0.3092193603515625, -0.25146484375, -0.1937103271484375, -0.135955810546875, -0.0782012939453125, -0.02044677734375, 0.0373077392578125, 0.095062255859375, 0.1528167724609375, 0.2105712890625, 0.2683258056640625, 0.326080322265625, 0.3838348388671875, 0.44158935546875, 0.4993438720703125, 0.557098388671875, 0.6148529052734375, 0.672607421875, 0.7303619384765625, 0.788116455078125, 0.8458709716796875, 0.90362548828125, 0.9613800048828125, 1.019134521484375, 1.0768890380859375, 1.1346435546875, 1.1923980712890625, 1.250152587890625, 1.3079071044921875, 1.36566162109375, 1.4234161376953125, 1.481170654296875, 1.5389251708984375, 1.5966796875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 3.0, 6.0, 9.0, 1.0, 11.0, 8.0, 6.0, 9.0, 18.0, 23.0, 28.0, 63.0, 68.0, 121.0, 151.0, 148.0, 98.0, 85.0, 45.0, 27.0, 19.0, 17.0, 11.0, 13.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00021469593048095703, -0.00020870007574558258, -0.00020270422101020813, -0.00019670836627483368, -0.00019071251153945923, -0.00018471665680408478, -0.00017872080206871033, -0.00017272494733333588, -0.00016672909259796143, -0.00016073323786258698, -0.00015473738312721252, -0.00014874152839183807, -0.00014274567365646362, -0.00013674981892108917, -0.00013075396418571472, -0.00012475810945034027, -0.00011876225471496582, -0.00011276639997959137, -0.00010677054524421692, -0.00010077469050884247, -9.477883577346802e-05, -8.878298103809357e-05, -8.278712630271912e-05, -7.679127156734467e-05, -7.079541683197021e-05, -6.479956209659576e-05, -5.8803707361221313e-05, -5.280785262584686e-05, -4.681199789047241e-05, -4.081614315509796e-05, -3.482028841972351e-05, -2.882443368434906e-05, -2.282857894897461e-05, -1.683272421360016e-05, -1.0836869478225708e-05, -4.841014742851257e-06, 1.1548399925231934e-06, 7.150694727897644e-06, 1.3146549463272095e-05, 1.9142404198646545e-05, 2.5138258934020996e-05, 3.113411366939545e-05, 3.71299684047699e-05, 4.312582314014435e-05, 4.91216778755188e-05, 5.511753261089325e-05, 6.11133873462677e-05, 6.710924208164215e-05, 7.31050968170166e-05, 7.910095155239105e-05, 8.50968062877655e-05, 9.109266102313995e-05, 9.70885157585144e-05, 0.00010308437049388885, 0.0001090802252292633, 0.00011507607996463776, 0.00012107193470001221, 0.00012706778943538666, 0.0001330636441707611, 0.00013905949890613556, 0.00014505535364151, 0.00015105120837688446, 0.0001570470631122589, 0.00016304291784763336, 0.0001690387725830078]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 9.0, 20.0, 15.0, 20.0, 31.0, 73.0, 102.0, 183.0, 324.0, 621.0, 1286.0, 2705.0, 7162.0, 22691.0, 106383.0, 656037.0, 198886.0, 34708.0, 10211.0, 3815.0, 1633.0, 747.0, 409.0, 191.0, 109.0, 74.0, 28.0, 29.0, 15.0, 11.0, 7.0, 2.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2724609375, -1.22955322265625, -1.1866455078125, -1.14373779296875, -1.100830078125, -1.05792236328125, -1.0150146484375, -0.97210693359375, -0.92919921875, -0.88629150390625, -0.8433837890625, -0.80047607421875, -0.757568359375, -0.71466064453125, -0.6717529296875, -0.62884521484375, -0.5859375, -0.54302978515625, -0.5001220703125, -0.45721435546875, -0.414306640625, -0.37139892578125, -0.3284912109375, -0.28558349609375, -0.24267578125, -0.19976806640625, -0.1568603515625, -0.11395263671875, -0.071044921875, -0.02813720703125, 0.0147705078125, 0.05767822265625, 0.1005859375, 0.14349365234375, 0.1864013671875, 0.22930908203125, 0.272216796875, 0.31512451171875, 0.3580322265625, 0.40093994140625, 0.44384765625, 0.48675537109375, 0.5296630859375, 0.57257080078125, 0.615478515625, 0.65838623046875, 0.7012939453125, 0.74420166015625, 0.787109375, 0.83001708984375, 0.8729248046875, 0.91583251953125, 0.958740234375, 1.00164794921875, 1.0445556640625, 1.08746337890625, 1.13037109375, 1.17327880859375, 1.2161865234375, 1.25909423828125, 1.302001953125, 1.34490966796875, 1.3878173828125, 1.43072509765625, 1.4736328125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0, 3.0, 5.0, 5.0, 5.0, 11.0, 17.0, 19.0, 27.0, 31.0, 35.0, 58.0, 52.0, 78.0, 86.0, 89.0, 90.0, 80.0, 74.0, 35.0, 38.0, 41.0, 24.0, 17.0, 25.0, 11.0, 6.0, 6.0, 9.0, 6.0, 3.0, 4.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51806640625, -0.50067138671875, -0.4832763671875, -0.46588134765625, -0.448486328125, -0.43109130859375, -0.4136962890625, -0.39630126953125, -0.37890625, -0.36151123046875, -0.3441162109375, -0.32672119140625, -0.309326171875, -0.29193115234375, -0.2745361328125, -0.25714111328125, -0.23974609375, -0.22235107421875, -0.2049560546875, -0.18756103515625, -0.170166015625, -0.15277099609375, -0.1353759765625, -0.11798095703125, -0.1005859375, -0.08319091796875, -0.0657958984375, -0.04840087890625, -0.031005859375, -0.01361083984375, 0.0037841796875, 0.02117919921875, 0.03857421875, 0.05596923828125, 0.0733642578125, 0.09075927734375, 0.108154296875, 0.12554931640625, 0.1429443359375, 0.16033935546875, 0.177734375, 0.19512939453125, 0.2125244140625, 0.22991943359375, 0.247314453125, 0.26470947265625, 0.2821044921875, 0.29949951171875, 0.31689453125, 0.33428955078125, 0.3516845703125, 0.36907958984375, 0.386474609375, 0.40386962890625, 0.4212646484375, 0.43865966796875, 0.4560546875, 0.47344970703125, 0.4908447265625, 0.50823974609375, 0.525634765625, 0.54302978515625, 0.5604248046875, 0.57781982421875, 0.59521484375]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 36.0, 365.0, 540.0, 61.0, 8.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.73247528076172, -35.62472152709961, -34.516971588134766, -33.409217834472656, -32.30146789550781, -31.193714141845703, -30.085960388183594, -28.978208541870117, -27.87045669555664, -26.762704849243164, -25.654953002929688, -24.547199249267578, -23.4394474029541, -22.331695556640625, -21.223941802978516, -20.11618995666504, -19.008438110351562, -17.900686264038086, -16.79293441772461, -15.6851806640625, -14.577428817749023, -13.469676971435547, -12.361924171447754, -11.254171371459961, -10.146419525146484, -9.038667678833008, -7.930914878845215, -6.82316255569458, -5.715410232543945, -4.6076579093933105, -3.499905586242676, -2.392153263092041, -1.2843971252441406, -0.17664480209350586, 0.9311075210571289, 2.0388598442077637, 3.1466121673583984, 4.254364490509033, 5.362116813659668, 6.469869136810303, 7.5776214599609375, 8.685373306274414, 9.793126106262207, 10.90087890625, 12.008630752563477, 13.116382598876953, 14.224135398864746, 15.331888198852539, 16.439640045166016, 17.547391891479492, 18.65514373779297, 19.762897491455078, 20.870649337768555, 21.97840118408203, 23.08615493774414, 24.193906784057617, 25.301658630371094, 26.40941047668457, 27.517162322998047, 28.624916076660156, 29.732667922973633, 30.84041976928711, 31.94817352294922, 33.05592346191406, 34.16367721557617]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 4.0, 8.0, 20.0, 17.0, 24.0, 32.0, 46.0, 53.0, 56.0, 48.0, 55.0, 59.0, 80.0, 67.0, 71.0, 66.0, 46.0, 54.0, 45.0, 31.0, 26.0, 20.0, 16.0, 20.0, 9.0, 12.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.758755683898926, -5.564199924468994, -5.3696441650390625, -5.175087928771973, -4.980532169342041, -4.785976409912109, -4.591420650482178, -4.396864891052246, -4.202308654785156, -4.007752895355225, -3.813196897506714, -3.6186411380767822, -3.4240851402282715, -3.22952938079834, -3.034973621368408, -2.8404178619384766, -2.645862102508545, -2.4513063430786133, -2.2567503452301025, -2.062194585800171, -1.8676387071609497, -1.6730828285217285, -1.4785270690917969, -1.2839711904525757, -1.0894153118133545, -0.8948594331741333, -0.7003036141395569, -0.5057477951049805, -0.3111919164657593, -0.11663603782653809, 0.07791972160339355, 0.27247560024261475, 0.46703147888183594, 0.6615873575210571, 0.8561431765556335, 1.05069899559021, 1.2452548742294312, 1.4398107528686523, 1.634366512298584, 1.8289223909378052, 2.0234782695770264, 2.218034029006958, 2.4125900268554688, 2.6071457862854004, 2.801701545715332, 2.9962575435638428, 3.1908133029937744, 3.385369300842285, 3.579925060272217, 3.7744808197021484, 3.969036817550659, 4.163592338562012, 4.358148574829102, 4.552704334259033, 4.747260093688965, 4.9418158531188965, 5.136371612548828, 5.33092737197876, 5.525483131408691, 5.720039367675781, 5.914595127105713, 6.1091508865356445, 6.303706645965576, 6.498262405395508, 6.692818641662598]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 10.0, 7.0, 13.0, 2.0, 9.0, 9.0, 11.0, 7.0, 29.0, 27.0, 28.0, 41.0, 35.0, 56.0, 102.0, 127.0, 146.0, 300.0, 588.0, 1432.0, 4735.0, 27097.0, 2829949.0, 1293935.0, 27986.0, 5153.0, 1468.0, 510.0, 215.0, 100.0, 60.0, 31.0, 18.0, 11.0, 12.0, 3.0, 4.0, 0.0, 2.0], "bins": [-6.50390625, -6.368377685546875, -6.23284912109375, -6.097320556640625, -5.9617919921875, -5.826263427734375, -5.69073486328125, -5.555206298828125, -5.419677734375, -5.284149169921875, -5.14862060546875, -5.013092041015625, -4.8775634765625, -4.742034912109375, -4.60650634765625, -4.470977783203125, -4.33544921875, -4.199920654296875, -4.06439208984375, -3.928863525390625, -3.7933349609375, -3.657806396484375, -3.52227783203125, -3.386749267578125, -3.251220703125, -3.115692138671875, -2.98016357421875, -2.844635009765625, -2.7091064453125, -2.573577880859375, -2.43804931640625, -2.302520751953125, -2.1669921875, -2.031463623046875, -1.89593505859375, -1.760406494140625, -1.6248779296875, -1.489349365234375, -1.35382080078125, -1.218292236328125, -1.082763671875, -0.947235107421875, -0.81170654296875, -0.676177978515625, -0.5406494140625, -0.405120849609375, -0.26959228515625, -0.134063720703125, 0.00146484375, 0.136993408203125, 0.27252197265625, 0.408050537109375, 0.5435791015625, 0.679107666015625, 0.81463623046875, 0.950164794921875, 1.085693359375, 1.221221923828125, 1.35675048828125, 1.492279052734375, 1.6278076171875, 1.763336181640625, 1.89886474609375, 2.034393310546875, 2.169921875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 12.0, 24.0, 71.0, 109.0, 128.0, 160.0, 169.0, 134.0, 82.0, 47.0, 36.0, 14.0, 8.0, 4.0, 4.0, 1.0, 1.0, 2.0], "bins": [-0.7548828125, -0.7403354644775391, -0.7257881164550781, -0.7112407684326172, -0.6966934204101562, -0.6821460723876953, -0.6675987243652344, -0.6530513763427734, -0.6385040283203125, -0.6239566802978516, -0.6094093322753906, -0.5948619842529297, -0.5803146362304688, -0.5657672882080078, -0.5512199401855469, -0.5366725921630859, -0.522125244140625, -0.5075778961181641, -0.4930305480957031, -0.4784832000732422, -0.46393585205078125, -0.4493885040283203, -0.4348411560058594, -0.42029380798339844, -0.4057464599609375, -0.39119911193847656, -0.3766517639160156, -0.3621044158935547, -0.34755706787109375, -0.3330097198486328, -0.3184623718261719, -0.30391502380371094, -0.28936767578125, -0.27482032775878906, -0.2602729797363281, -0.2457256317138672, -0.23117828369140625, -0.2166309356689453, -0.20208358764648438, -0.18753623962402344, -0.1729888916015625, -0.15844154357910156, -0.14389419555664062, -0.1293468475341797, -0.11479949951171875, -0.10025215148925781, -0.08570480346679688, -0.07115745544433594, -0.056610107421875, -0.04206275939941406, -0.027515411376953125, -0.012968063354492188, 0.00157928466796875, 0.016126632690429688, 0.030673980712890625, 0.04522132873535156, 0.0597686767578125, 0.07431602478027344, 0.08886337280273438, 0.10341072082519531, 0.11795806884765625, 0.1325054168701172, 0.14705276489257812, 0.16160011291503906, 0.1761474609375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 12.0, 12.0, 17.0, 26.0, 36.0, 59.0, 81.0, 132.0, 277.0, 642.0, 3438.0, 4136059.0, 51714.0, 1116.0, 316.0, 147.0, 80.0, 49.0, 27.0, 20.0, 14.0, 6.0, 3.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.515625, -18.05029296875, -17.5849609375, -17.11962890625, -16.654296875, -16.18896484375, -15.7236328125, -15.25830078125, -14.79296875, -14.32763671875, -13.8623046875, -13.39697265625, -12.931640625, -12.46630859375, -12.0009765625, -11.53564453125, -11.0703125, -10.60498046875, -10.1396484375, -9.67431640625, -9.208984375, -8.74365234375, -8.2783203125, -7.81298828125, -7.34765625, -6.88232421875, -6.4169921875, -5.95166015625, -5.486328125, -5.02099609375, -4.5556640625, -4.09033203125, -3.625, -3.15966796875, -2.6943359375, -2.22900390625, -1.763671875, -1.29833984375, -0.8330078125, -0.36767578125, 0.09765625, 0.56298828125, 1.0283203125, 1.49365234375, 1.958984375, 2.42431640625, 2.8896484375, 3.35498046875, 3.8203125, 4.28564453125, 4.7509765625, 5.21630859375, 5.681640625, 6.14697265625, 6.6123046875, 7.07763671875, 7.54296875, 8.00830078125, 8.4736328125, 8.93896484375, 9.404296875, 9.86962890625, 10.3349609375, 10.80029296875, 11.265625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 24.0, 55.0, 199.0, 3117.0, 503.0, 108.0, 45.0, 10.0, 10.0, 0.0, 5.0], "bins": [-2.6796875, -2.6324539184570312, -2.5852203369140625, -2.5379867553710938, -2.490753173828125, -2.4435195922851562, -2.3962860107421875, -2.3490524291992188, -2.30181884765625, -2.2545852661132812, -2.2073516845703125, -2.1601181030273438, -2.112884521484375, -2.0656509399414062, -2.0184173583984375, -1.9711837768554688, -1.9239501953125, -1.8767166137695312, -1.8294830322265625, -1.7822494506835938, -1.735015869140625, -1.6877822875976562, -1.6405487060546875, -1.5933151245117188, -1.54608154296875, -1.4988479614257812, -1.4516143798828125, -1.4043807983398438, -1.357147216796875, -1.3099136352539062, -1.2626800537109375, -1.2154464721679688, -1.168212890625, -1.1209793090820312, -1.0737457275390625, -1.0265121459960938, -0.979278564453125, -0.9320449829101562, -0.8848114013671875, -0.8375778198242188, -0.79034423828125, -0.7431106567382812, -0.6958770751953125, -0.6486434936523438, -0.601409912109375, -0.5541763305664062, -0.5069427490234375, -0.45970916748046875, -0.4124755859375, -0.36524200439453125, -0.3180084228515625, -0.27077484130859375, -0.223541259765625, -0.17630767822265625, -0.1290740966796875, -0.08184051513671875, -0.03460693359375, 0.01262664794921875, 0.0598602294921875, 0.10709381103515625, 0.154327392578125, 0.20156097412109375, 0.2487945556640625, 0.29602813720703125, 0.34326171875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 9.0, 10.0, 15.0, 61.0, 243.0, 404.0, 186.0, 41.0, 21.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.365792274475098, -14.01054573059082, -13.65530014038086, -13.300053596496582, -12.944807052612305, -12.589561462402344, -12.234314918518066, -11.879068374633789, -11.523822784423828, -11.16857624053955, -10.81333065032959, -10.458084106445312, -10.102837562561035, -9.747591018676758, -9.392345428466797, -9.03709888458252, -8.681852340698242, -8.326605796813965, -7.971359729766846, -7.616113662719727, -7.260867118835449, -6.90562105178833, -6.550374984741211, -6.195128440856934, -5.8398823738098145, -5.484636306762695, -5.129389762878418, -4.774143695831299, -4.41889762878418, -4.063651084899902, -3.708405017852783, -3.353158712387085, -2.997913360595703, -2.642667055130005, -2.2874207496643066, -1.9321746826171875, -1.5769283771514893, -1.221682071685791, -0.8664360046386719, -0.5111896991729736, -0.1559433937072754, 0.19930285215377808, 0.5545490980148315, 0.9097952842712402, 1.2650415897369385, 1.6202878952026367, 1.9755339622497559, 2.330780267715454, 2.6860265731811523, 3.0412728786468506, 3.396519184112549, 3.751765251159668, 4.107011795043945, 4.4622578620910645, 4.817503929138184, 5.172750473022461, 5.52799654006958, 5.883242607116699, 6.238489151000977, 6.593735218048096, 6.948981285095215, 7.304227828979492, 7.659473896026611, 8.01471996307373, 8.369966506958008]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 4.0, 5.0, 14.0, 25.0, 38.0, 49.0, 64.0, 79.0, 124.0, 115.0, 109.0, 91.0, 95.0, 67.0, 45.0, 30.0, 21.0, 10.0, 10.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.531558990478516, -5.361130714416504, -5.190702438354492, -5.0202741622924805, -4.8498454093933105, -4.679417133331299, -4.508988857269287, -4.338560581207275, -4.1681318283081055, -3.9977035522460938, -3.827275037765503, -3.656846761703491, -3.4864182472229004, -3.3159899711608887, -3.145561695098877, -2.9751334190368652, -2.8047051429748535, -2.634276866912842, -2.463848352432251, -2.2934200763702393, -2.1229915618896484, -1.9525632858276367, -1.782135009765625, -1.6117066144943237, -1.4412782192230225, -1.2708498239517212, -1.10042142868042, -0.9299931526184082, -0.7595647573471069, -0.5891363620758057, -0.41870808601379395, -0.24827969074249268, -0.0778508186340332, 0.09257754683494568, 0.26300591230392456, 0.43343424797058105, 0.6038626432418823, 0.7742910385131836, 0.9447193145751953, 1.1151477098464966, 1.2855761051177979, 1.4560045003890991, 1.6264328956604004, 1.796861171722412, 1.9672895669937134, 2.1377179622650146, 2.3081462383270264, 2.478574752807617, 2.649003028869629, 2.8194313049316406, 2.9898598194122314, 3.160288095474243, 3.330716609954834, 3.5011448860168457, 3.6715731620788574, 3.842001438140869, 4.012430191040039, 4.182858467102051, 4.3532867431640625, 4.523715019226074, 4.694143772125244, 4.864572048187256, 5.035000324249268, 5.205428600311279, 5.375856876373291]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 9.0, 4.0, 9.0, 7.0, 16.0, 16.0, 24.0, 30.0, 54.0, 58.0, 94.0, 133.0, 227.0, 372.0, 745.0, 1708.0, 6225.0, 35079.0, 513543.0, 449224.0, 31980.0, 5648.0, 1679.0, 679.0, 331.0, 218.0, 133.0, 81.0, 56.0, 40.0, 34.0, 18.0, 22.0, 16.0, 6.0, 8.0, 6.0, 4.0, 5.0, 5.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.203125, -3.088623046875, -2.97412109375, -2.859619140625, -2.7451171875, -2.630615234375, -2.51611328125, -2.401611328125, -2.287109375, -2.172607421875, -2.05810546875, -1.943603515625, -1.8291015625, -1.714599609375, -1.60009765625, -1.485595703125, -1.37109375, -1.256591796875, -1.14208984375, -1.027587890625, -0.9130859375, -0.798583984375, -0.68408203125, -0.569580078125, -0.455078125, -0.340576171875, -0.22607421875, -0.111572265625, 0.0029296875, 0.117431640625, 0.23193359375, 0.346435546875, 0.4609375, 0.575439453125, 0.68994140625, 0.804443359375, 0.9189453125, 1.033447265625, 1.14794921875, 1.262451171875, 1.376953125, 1.491455078125, 1.60595703125, 1.720458984375, 1.8349609375, 1.949462890625, 2.06396484375, 2.178466796875, 2.29296875, 2.407470703125, 2.52197265625, 2.636474609375, 2.7509765625, 2.865478515625, 2.97998046875, 3.094482421875, 3.208984375, 3.323486328125, 3.43798828125, 3.552490234375, 3.6669921875, 3.781494140625, 3.89599609375, 4.010498046875, 4.125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 10.0, 26.0, 71.0, 76.0, 98.0, 147.0, 138.0, 127.0, 109.0, 88.0, 39.0, 29.0, 19.0, 11.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8359375, -0.8167076110839844, -0.7974777221679688, -0.7782478332519531, -0.7590179443359375, -0.7397880554199219, -0.7205581665039062, -0.7013282775878906, -0.682098388671875, -0.6628684997558594, -0.6436386108398438, -0.6244087219238281, -0.6051788330078125, -0.5859489440917969, -0.5667190551757812, -0.5474891662597656, -0.52825927734375, -0.5090293884277344, -0.48979949951171875, -0.4705696105957031, -0.4513397216796875, -0.4321098327636719, -0.41287994384765625, -0.3936500549316406, -0.374420166015625, -0.3551902770996094, -0.33596038818359375, -0.3167304992675781, -0.2975006103515625, -0.2782707214355469, -0.25904083251953125, -0.23981094360351562, -0.2205810546875, -0.20135116577148438, -0.18212127685546875, -0.16289138793945312, -0.1436614990234375, -0.12443161010742188, -0.10520172119140625, -0.08597183227539062, -0.066741943359375, -0.047512054443359375, -0.02828216552734375, -0.009052276611328125, 0.0101776123046875, 0.029407501220703125, 0.04863739013671875, 0.06786727905273438, 0.08709716796875, 0.10632705688476562, 0.12555694580078125, 0.14478683471679688, 0.1640167236328125, 0.18324661254882812, 0.20247650146484375, 0.22170639038085938, 0.240936279296875, 0.2601661682128906, 0.27939605712890625, 0.2986259460449219, 0.3178558349609375, 0.3370857238769531, 0.35631561279296875, 0.3755455017089844, 0.394775390625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 1.0, 6.0, 4.0, 4.0, 14.0, 16.0, 18.0, 23.0, 32.0, 42.0, 67.0, 81.0, 137.0, 212.0, 321.0, 548.0, 1094.0, 2000.0, 4087.0, 9476.0, 26716.0, 92605.0, 374210.0, 391712.0, 98182.0, 27773.0, 10042.0, 4311.0, 2001.0, 1159.0, 615.0, 378.0, 249.0, 136.0, 92.0, 51.0, 37.0, 31.0, 18.0, 13.0, 13.0, 14.0, 2.0, 3.0, 7.0, 3.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2998046875, -1.257904052734375, -1.21600341796875, -1.174102783203125, -1.1322021484375, -1.090301513671875, -1.04840087890625, -1.006500244140625, -0.964599609375, -0.922698974609375, -0.88079833984375, -0.838897705078125, -0.7969970703125, -0.755096435546875, -0.71319580078125, -0.671295166015625, -0.62939453125, -0.587493896484375, -0.54559326171875, -0.503692626953125, -0.4617919921875, -0.419891357421875, -0.37799072265625, -0.336090087890625, -0.294189453125, -0.252288818359375, -0.21038818359375, -0.168487548828125, -0.1265869140625, -0.084686279296875, -0.04278564453125, -0.000885009765625, 0.041015625, 0.082916259765625, 0.12481689453125, 0.166717529296875, 0.2086181640625, 0.250518798828125, 0.29241943359375, 0.334320068359375, 0.376220703125, 0.418121337890625, 0.46002197265625, 0.501922607421875, 0.5438232421875, 0.585723876953125, 0.62762451171875, 0.669525146484375, 0.71142578125, 0.753326416015625, 0.79522705078125, 0.837127685546875, 0.8790283203125, 0.920928955078125, 0.96282958984375, 1.004730224609375, 1.046630859375, 1.088531494140625, 1.13043212890625, 1.172332763671875, 1.2142333984375, 1.256134033203125, 1.29803466796875, 1.339935302734375, 1.3818359375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 5.0, 0.0, 3.0, 4.0, 7.0, 11.0, 13.0, 17.0, 27.0, 18.0, 23.0, 34.0, 36.0, 37.0, 51.0, 50.0, 54.0, 63.0, 76.0, 63.0, 55.0, 39.0, 46.0, 46.0, 41.0, 41.0, 25.0, 38.0, 14.0, 11.0, 16.0, 15.0, 3.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.09765625, -1.059417724609375, -1.02117919921875, -0.982940673828125, -0.9447021484375, -0.906463623046875, -0.86822509765625, -0.829986572265625, -0.791748046875, -0.753509521484375, -0.71527099609375, -0.677032470703125, -0.6387939453125, -0.600555419921875, -0.56231689453125, -0.524078369140625, -0.48583984375, -0.447601318359375, -0.40936279296875, -0.371124267578125, -0.3328857421875, -0.294647216796875, -0.25640869140625, -0.218170166015625, -0.179931640625, -0.141693115234375, -0.10345458984375, -0.065216064453125, -0.0269775390625, 0.011260986328125, 0.04949951171875, 0.087738037109375, 0.1259765625, 0.164215087890625, 0.20245361328125, 0.240692138671875, 0.2789306640625, 0.317169189453125, 0.35540771484375, 0.393646240234375, 0.431884765625, 0.470123291015625, 0.50836181640625, 0.546600341796875, 0.5848388671875, 0.623077392578125, 0.66131591796875, 0.699554443359375, 0.73779296875, 0.776031494140625, 0.81427001953125, 0.852508544921875, 0.8907470703125, 0.928985595703125, 0.96722412109375, 1.005462646484375, 1.043701171875, 1.081939697265625, 1.12017822265625, 1.158416748046875, 1.1966552734375, 1.234893798828125, 1.27313232421875, 1.311370849609375, 1.349609375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 2.0, 7.0, 2.0, 3.0, 7.0, 6.0, 11.0, 16.0, 29.0, 52.0, 89.0, 194.0, 469.0, 1245.0, 4736.0, 24290.0, 702415.0, 295151.0, 14772.0, 3305.0, 1022.0, 367.0, 170.0, 71.0, 40.0, 29.0, 21.0, 13.0, 4.0, 8.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.064453125, -2.003509521484375, -1.94256591796875, -1.881622314453125, -1.8206787109375, -1.759735107421875, -1.69879150390625, -1.637847900390625, -1.576904296875, -1.515960693359375, -1.45501708984375, -1.394073486328125, -1.3331298828125, -1.272186279296875, -1.21124267578125, -1.150299072265625, -1.08935546875, -1.028411865234375, -0.96746826171875, -0.906524658203125, -0.8455810546875, -0.784637451171875, -0.72369384765625, -0.662750244140625, -0.601806640625, -0.540863037109375, -0.47991943359375, -0.418975830078125, -0.3580322265625, -0.297088623046875, -0.23614501953125, -0.175201416015625, -0.1142578125, -0.053314208984375, 0.00762939453125, 0.068572998046875, 0.1295166015625, 0.190460205078125, 0.25140380859375, 0.312347412109375, 0.373291015625, 0.434234619140625, 0.49517822265625, 0.556121826171875, 0.6170654296875, 0.678009033203125, 0.73895263671875, 0.799896240234375, 0.86083984375, 0.921783447265625, 0.98272705078125, 1.043670654296875, 1.1046142578125, 1.165557861328125, 1.22650146484375, 1.287445068359375, 1.348388671875, 1.409332275390625, 1.47027587890625, 1.531219482421875, 1.5921630859375, 1.653106689453125, 1.71405029296875, 1.774993896484375, 1.8359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 12.0, 25.0, 29.0, 41.0, 76.0, 105.0, 154.0, 178.0, 133.0, 77.0, 53.0, 31.0, 27.0, 17.0, 10.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0002040863037109375, -0.00019684433937072754, -0.00018960237503051758, -0.00018236041069030762, -0.00017511844635009766, -0.0001678764820098877, -0.00016063451766967773, -0.00015339255332946777, -0.0001461505889892578, -0.00013890862464904785, -0.0001316666603088379, -0.00012442469596862793, -0.00011718273162841797, -0.00010994076728820801, -0.00010269880294799805, -9.545683860778809e-05, -8.821487426757812e-05, -8.097290992736816e-05, -7.37309455871582e-05, -6.648898124694824e-05, -5.924701690673828e-05, -5.200505256652832e-05, -4.476308822631836e-05, -3.75211238861084e-05, -3.0279159545898438e-05, -2.3037195205688477e-05, -1.5795230865478516e-05, -8.553266525268555e-06, -1.3113021850585938e-06, 5.930662155151367e-06, 1.3172626495361328e-05, 2.041459083557129e-05, 2.765655517578125e-05, 3.489851951599121e-05, 4.214048385620117e-05, 4.938244819641113e-05, 5.6624412536621094e-05, 6.386637687683105e-05, 7.110834121704102e-05, 7.835030555725098e-05, 8.559226989746094e-05, 9.28342342376709e-05, 0.00010007619857788086, 0.00010731816291809082, 0.00011456012725830078, 0.00012180209159851074, 0.0001290440559387207, 0.00013628602027893066, 0.00014352798461914062, 0.00015076994895935059, 0.00015801191329956055, 0.0001652538776397705, 0.00017249584197998047, 0.00017973780632019043, 0.0001869797706604004, 0.00019422173500061035, 0.0002014636993408203, 0.00020870566368103027, 0.00021594762802124023, 0.0002231895923614502, 0.00023043155670166016, 0.00023767352104187012, 0.0002449154853820801, 0.00025215744972229004, 0.0002593994140625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 11.0, 14.0, 21.0, 33.0, 56.0, 99.0, 162.0, 347.0, 890.0, 2182.0, 6932.0, 33801.0, 572090.0, 396638.0, 25995.0, 5861.0, 1893.0, 786.0, 392.0, 160.0, 89.0, 38.0, 22.0, 11.0, 11.0, 10.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3994140625, -1.3493194580078125, -1.299224853515625, -1.2491302490234375, -1.19903564453125, -1.1489410400390625, -1.098846435546875, -1.0487518310546875, -0.9986572265625, -0.9485626220703125, -0.898468017578125, -0.8483734130859375, -0.79827880859375, -0.7481842041015625, -0.698089599609375, -0.6479949951171875, -0.597900390625, -0.5478057861328125, -0.497711181640625, -0.4476165771484375, -0.39752197265625, -0.3474273681640625, -0.297332763671875, -0.2472381591796875, -0.1971435546875, -0.1470489501953125, -0.096954345703125, -0.0468597412109375, 0.00323486328125, 0.0533294677734375, 0.103424072265625, 0.1535186767578125, 0.20361328125, 0.2537078857421875, 0.303802490234375, 0.3538970947265625, 0.40399169921875, 0.4540863037109375, 0.504180908203125, 0.5542755126953125, 0.6043701171875, 0.6544647216796875, 0.704559326171875, 0.7546539306640625, 0.80474853515625, 0.8548431396484375, 0.904937744140625, 0.9550323486328125, 1.005126953125, 1.0552215576171875, 1.105316162109375, 1.1554107666015625, 1.20550537109375, 1.2555999755859375, 1.305694580078125, 1.3557891845703125, 1.4058837890625, 1.4559783935546875, 1.506072998046875, 1.5561676025390625, 1.60626220703125, 1.6563568115234375, 1.706451416015625, 1.7565460205078125, 1.806640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 8.0, 8.0, 17.0, 17.0, 22.0, 34.0, 52.0, 51.0, 76.0, 93.0, 121.0, 113.0, 96.0, 77.0, 59.0, 40.0, 17.0, 30.0, 14.0, 12.0, 12.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52392578125, -0.5051040649414062, -0.4862823486328125, -0.46746063232421875, -0.448638916015625, -0.42981719970703125, -0.4109954833984375, -0.39217376708984375, -0.37335205078125, -0.35453033447265625, -0.3357086181640625, -0.31688690185546875, -0.298065185546875, -0.27924346923828125, -0.2604217529296875, -0.24160003662109375, -0.2227783203125, -0.20395660400390625, -0.1851348876953125, -0.16631317138671875, -0.147491455078125, -0.12866973876953125, -0.1098480224609375, -0.09102630615234375, -0.07220458984375, -0.05338287353515625, -0.0345611572265625, -0.01573944091796875, 0.003082275390625, 0.02190399169921875, 0.0407257080078125, 0.05954742431640625, 0.078369140625, 0.09719085693359375, 0.1160125732421875, 0.13483428955078125, 0.153656005859375, 0.17247772216796875, 0.1912994384765625, 0.21012115478515625, 0.22894287109375, 0.24776458740234375, 0.2665863037109375, 0.28540802001953125, 0.304229736328125, 0.32305145263671875, 0.3418731689453125, 0.36069488525390625, 0.3795166015625, 0.39833831787109375, 0.4171600341796875, 0.43598175048828125, 0.454803466796875, 0.47362518310546875, 0.4924468994140625, 0.5112686157226562, 0.53009033203125, 0.5489120483398438, 0.5677337646484375, 0.5865554809570312, 0.605377197265625, 0.6241989135742188, 0.6430206298828125, 0.6618423461914062, 0.6806640625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 5.0, 1.0, 10.0, 20.0, 26.0, 53.0, 135.0, 217.0, 224.0, 156.0, 84.0, 39.0, 15.0, 12.0, 8.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.674236297607422, -20.25298500061035, -19.83173370361328, -19.41048240661621, -18.98923110961914, -18.567977905273438, -18.146726608276367, -17.725475311279297, -17.304224014282227, -16.882972717285156, -16.461721420288086, -16.040470123291016, -15.619217872619629, -15.197966575622559, -14.776714324951172, -14.355463027954102, -13.934211730957031, -13.512960433959961, -13.09170913696289, -12.670456886291504, -12.249205589294434, -11.827954292297363, -11.406702041625977, -10.985450744628906, -10.564199447631836, -10.142948150634766, -9.721696853637695, -9.300444602966309, -8.879193305969238, -8.457942008972168, -8.036689758300781, -7.615438461303711, -7.194188117980957, -6.772936820983887, -6.351685047149658, -5.93043327331543, -5.509181976318359, -5.087930679321289, -4.6666789054870605, -4.245427131652832, -3.8241758346557617, -3.4029242992401123, -2.981672763824463, -2.5604212284088135, -2.139169692993164, -1.7179181575775146, -1.2966666221618652, -0.8754150867462158, -0.4541635513305664, -0.03291201591491699, 0.3883395195007324, 0.8095910549163818, 1.2308425903320312, 1.6520941257476807, 2.07334566116333, 2.4945971965789795, 2.915848731994629, 3.3371002674102783, 3.7583518028259277, 4.179603576660156, 4.600854873657227, 5.022106170654297, 5.443357944488525, 5.864609718322754, 6.285861015319824]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 4.0, 8.0, 7.0, 6.0, 14.0, 12.0, 21.0, 23.0, 27.0, 21.0, 31.0, 43.0, 36.0, 55.0, 38.0, 48.0, 59.0, 57.0, 48.0, 51.0, 40.0, 56.0, 41.0, 37.0, 32.0, 32.0, 25.0, 24.0, 19.0, 18.0, 18.0, 8.0, 12.0, 7.0, 4.0, 4.0, 1.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.928624153137207, -4.746648788452148, -4.56467342376709, -4.382698059082031, -4.200722694396973, -4.018747329711914, -3.8367722034454346, -3.654796838760376, -3.4728214740753174, -3.290846109390259, -3.1088707447052, -2.9268956184387207, -2.744920253753662, -2.5629448890686035, -2.380969524383545, -2.1989941596984863, -2.0170187950134277, -1.8350434303283691, -1.6530680656433105, -1.4710928201675415, -1.289117455482483, -1.1071420907974243, -0.9251668453216553, -0.7431914806365967, -0.5612161159515381, -0.3792407810688019, -0.19726544618606567, -0.015290141105651855, 0.16668522357940674, 0.34866058826446533, 0.5306358337402344, 0.712611198425293, 0.8945860862731934, 1.076561450958252, 1.2585368156433105, 1.4405120611190796, 1.6224874258041382, 1.8044627904891968, 1.9864380359649658, 2.1684134006500244, 2.350388765335083, 2.5323641300201416, 2.7143394947052, 2.8963146209716797, 3.0782899856567383, 3.260265350341797, 3.4422407150268555, 3.624216079711914, 3.8061914443969727, 3.9881668090820312, 4.17014217376709, 4.352117538452148, 4.534092903137207, 4.716068267822266, 4.898043632507324, 5.080018997192383, 5.261994361877441, 5.4439697265625, 5.625945091247559, 5.807920455932617, 5.989895820617676, 6.171871185302734, 6.353846549987793, 6.535821914672852, 6.717796802520752]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 4.0, 4.0, 11.0, 11.0, 23.0, 31.0, 60.0, 108.0, 176.0, 368.0, 729.0, 3663.0, 59629.0, 4104051.0, 22282.0, 2201.0, 558.0, 204.0, 81.0, 42.0, 15.0, 13.0, 5.0, 9.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4140625, -9.1807861328125, -8.947509765625, -8.7142333984375, -8.48095703125, -8.2476806640625, -8.014404296875, -7.7811279296875, -7.5478515625, -7.3145751953125, -7.081298828125, -6.8480224609375, -6.61474609375, -6.3814697265625, -6.148193359375, -5.9149169921875, -5.681640625, -5.4483642578125, -5.215087890625, -4.9818115234375, -4.74853515625, -4.5152587890625, -4.281982421875, -4.0487060546875, -3.8154296875, -3.5821533203125, -3.348876953125, -3.1156005859375, -2.88232421875, -2.6490478515625, -2.415771484375, -2.1824951171875, -1.94921875, -1.7159423828125, -1.482666015625, -1.2493896484375, -1.01611328125, -0.7828369140625, -0.549560546875, -0.3162841796875, -0.0830078125, 0.1502685546875, 0.383544921875, 0.6168212890625, 0.85009765625, 1.0833740234375, 1.316650390625, 1.5499267578125, 1.783203125, 2.0164794921875, 2.249755859375, 2.4830322265625, 2.71630859375, 2.9495849609375, 3.182861328125, 3.4161376953125, 3.6494140625, 3.8826904296875, 4.115966796875, 4.3492431640625, 4.58251953125, 4.8157958984375, 5.049072265625, 5.2823486328125, 5.515625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 9.0, 12.0, 21.0, 37.0, 61.0, 87.0, 105.0, 121.0, 114.0, 112.0, 105.0, 76.0, 62.0, 34.0, 21.0, 12.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.84033203125, -0.8222274780273438, -0.8041229248046875, -0.7860183715820312, -0.767913818359375, -0.7498092651367188, -0.7317047119140625, -0.7136001586914062, -0.69549560546875, -0.6773910522460938, -0.6592864990234375, -0.6411819458007812, -0.623077392578125, -0.6049728393554688, -0.5868682861328125, -0.5687637329101562, -0.5506591796875, -0.5325546264648438, -0.5144500732421875, -0.49634552001953125, -0.478240966796875, -0.46013641357421875, -0.4420318603515625, -0.42392730712890625, -0.40582275390625, -0.38771820068359375, -0.3696136474609375, -0.35150909423828125, -0.333404541015625, -0.31529998779296875, -0.2971954345703125, -0.27909088134765625, -0.260986328125, -0.24288177490234375, -0.2247772216796875, -0.20667266845703125, -0.188568115234375, -0.17046356201171875, -0.1523590087890625, -0.13425445556640625, -0.11614990234375, -0.09804534912109375, -0.0799407958984375, -0.06183624267578125, -0.043731689453125, -0.02562713623046875, -0.0075225830078125, 0.01058197021484375, 0.0286865234375, 0.04679107666015625, 0.0648956298828125, 0.08300018310546875, 0.101104736328125, 0.11920928955078125, 0.1373138427734375, 0.15541839599609375, 0.17352294921875, 0.19162750244140625, 0.2097320556640625, 0.22783660888671875, 0.245941162109375, 0.26404571533203125, 0.2821502685546875, 0.30025482177734375, 0.318359375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 10.0, 10.0, 22.0, 36.0, 56.0, 97.0, 152.0, 329.0, 614.0, 1362.0, 4104.0, 24199.0, 3725138.0, 417574.0, 15424.0, 3072.0, 1086.0, 487.0, 231.0, 129.0, 56.0, 31.0, 28.0, 15.0, 2.0, 8.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.328125, -5.191131591796875, -5.05413818359375, -4.917144775390625, -4.7801513671875, -4.643157958984375, -4.50616455078125, -4.369171142578125, -4.232177734375, -4.095184326171875, -3.95819091796875, -3.821197509765625, -3.6842041015625, -3.547210693359375, -3.41021728515625, -3.273223876953125, -3.13623046875, -2.999237060546875, -2.86224365234375, -2.725250244140625, -2.5882568359375, -2.451263427734375, -2.31427001953125, -2.177276611328125, -2.040283203125, -1.903289794921875, -1.76629638671875, -1.629302978515625, -1.4923095703125, -1.355316162109375, -1.21832275390625, -1.081329345703125, -0.9443359375, -0.807342529296875, -0.67034912109375, -0.533355712890625, -0.3963623046875, -0.259368896484375, -0.12237548828125, 0.014617919921875, 0.151611328125, 0.288604736328125, 0.42559814453125, 0.562591552734375, 0.6995849609375, 0.836578369140625, 0.97357177734375, 1.110565185546875, 1.24755859375, 1.384552001953125, 1.52154541015625, 1.658538818359375, 1.7955322265625, 1.932525634765625, 2.06951904296875, 2.206512451171875, 2.343505859375, 2.480499267578125, 2.61749267578125, 2.754486083984375, 2.8914794921875, 3.028472900390625, 3.16546630859375, 3.302459716796875, 3.439453125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 11.0, 11.0, 24.0, 37.0, 80.0, 185.0, 1330.0, 2038.0, 178.0, 71.0, 46.0, 28.0, 11.0, 7.0, 11.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98095703125, -0.9529647827148438, -0.9249725341796875, -0.8969802856445312, -0.868988037109375, -0.8409957885742188, -0.8130035400390625, -0.7850112915039062, -0.75701904296875, -0.7290267944335938, -0.7010345458984375, -0.6730422973632812, -0.645050048828125, -0.6170578002929688, -0.5890655517578125, -0.5610733032226562, -0.5330810546875, -0.5050888061523438, -0.4770965576171875, -0.44910430908203125, -0.421112060546875, -0.39311981201171875, -0.3651275634765625, -0.33713531494140625, -0.30914306640625, -0.28115081787109375, -0.2531585693359375, -0.22516632080078125, -0.197174072265625, -0.16918182373046875, -0.1411895751953125, -0.11319732666015625, -0.085205078125, -0.05721282958984375, -0.0292205810546875, -0.00122833251953125, 0.026763916015625, 0.05475616455078125, 0.0827484130859375, 0.11074066162109375, 0.13873291015625, 0.16672515869140625, 0.1947174072265625, 0.22270965576171875, 0.250701904296875, 0.27869415283203125, 0.3066864013671875, 0.33467864990234375, 0.3626708984375, 0.39066314697265625, 0.4186553955078125, 0.44664764404296875, 0.474639892578125, 0.5026321411132812, 0.5306243896484375, 0.5586166381835938, 0.58660888671875, 0.6146011352539062, 0.6425933837890625, 0.6705856323242188, 0.698577880859375, 0.7265701293945312, 0.7545623779296875, 0.7825546264648438, 0.810546875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 11.0, 13.0, 70.0, 225.0, 356.0, 212.0, 77.0, 26.0, 6.0, 7.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.263915538787842, -6.028168201446533, -5.792420864105225, -5.556673526763916, -5.320925712585449, -5.085178375244141, -4.849431037902832, -4.613683700561523, -4.377936363220215, -4.142189025878906, -3.9064416885375977, -3.67069411277771, -3.4349467754364014, -3.1991994380950928, -2.963451862335205, -2.7277045249938965, -2.491957187652588, -2.2562098503112793, -2.0204625129699707, -1.784714937210083, -1.5489675998687744, -1.3132202625274658, -1.0774728059768677, -0.8417253494262695, -0.6059780120849609, -0.37023061513900757, -0.1344832181930542, 0.10126417875289917, 0.33701157569885254, 0.5727589130401611, 0.8085063695907593, 1.0442538261413574, 1.2800006866455078, 1.5157480239868164, 1.7514954805374146, 1.9872429370880127, 2.2229902744293213, 2.45873761177063, 2.6944851875305176, 2.930232524871826, 3.1659798622131348, 3.4017271995544434, 3.637474536895752, 3.8732221126556396, 4.108969688415527, 4.344717025756836, 4.5804643630981445, 4.816211700439453, 5.051959037780762, 5.28770637512207, 5.523453712463379, 5.7592010498046875, 5.994948387145996, 6.230695724487305, 6.4664435386657715, 6.70219087600708, 6.937938213348389, 7.173685550689697, 7.409432888031006, 7.6451802253723145, 7.880928039550781, 8.11667537689209, 8.352422714233398, 8.588170051574707, 8.823917388916016]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 13.0, 11.0, 18.0, 25.0, 25.0, 35.0, 40.0, 58.0, 65.0, 77.0, 70.0, 70.0, 81.0, 52.0, 67.0, 56.0, 61.0, 36.0, 41.0, 29.0, 15.0, 16.0, 7.0, 7.0, 8.0, 8.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.111163377761841, -3.0283901691436768, -2.9456169605255127, -2.8628437519073486, -2.7800705432891846, -2.6972973346710205, -2.6145241260528564, -2.5317511558532715, -2.4489779472351074, -2.3662047386169434, -2.2834315299987793, -2.2006583213806152, -2.117885112762451, -2.035111904144287, -1.9523388147354126, -1.8695656061172485, -1.786792278289795, -1.7040190696716309, -1.6212458610534668, -1.5384726524353027, -1.4556994438171387, -1.3729262351989746, -1.2901531457901, -1.207379937171936, -1.124606728553772, -1.041833519935608, -0.9590603113174438, -0.8762871623039246, -0.7935139536857605, -0.7107407450675964, -0.6279675960540771, -0.5451943874359131, -0.462421178817749, -0.37964797019958496, -0.2968747913837433, -0.21410159766674042, -0.13132840394973755, -0.048555195331573486, 0.03421798348426819, 0.11699116230010986, 0.19976437091827393, 0.282537579536438, 0.36531075835227966, 0.44808393716812134, 0.5308571457862854, 0.6136303544044495, 0.6964035034179688, 0.7791767120361328, 0.8619499206542969, 0.9447231292724609, 1.027496337890625, 1.110269546508789, 1.1930427551269531, 1.2758159637451172, 1.3585890531539917, 1.4413622617721558, 1.5241354703903198, 1.6069086790084839, 1.689681887626648, 1.772455096244812, 1.8552281856536865, 1.9380013942718506, 2.0207746028900146, 2.1035478115081787, 2.1863210201263428]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 11.0, 10.0, 11.0, 19.0, 32.0, 41.0, 68.0, 111.0, 177.0, 397.0, 821.0, 2335.0, 11703.0, 147836.0, 798045.0, 75835.0, 7786.0, 1893.0, 635.0, 327.0, 165.0, 95.0, 77.0, 43.0, 32.0, 15.0, 7.0, 11.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0078125, -4.88067626953125, -4.7535400390625, -4.62640380859375, -4.499267578125, -4.37213134765625, -4.2449951171875, -4.11785888671875, -3.99072265625, -3.86358642578125, -3.7364501953125, -3.60931396484375, -3.482177734375, -3.35504150390625, -3.2279052734375, -3.10076904296875, -2.9736328125, -2.84649658203125, -2.7193603515625, -2.59222412109375, -2.465087890625, -2.33795166015625, -2.2108154296875, -2.08367919921875, -1.95654296875, -1.82940673828125, -1.7022705078125, -1.57513427734375, -1.447998046875, -1.32086181640625, -1.1937255859375, -1.06658935546875, -0.939453125, -0.81231689453125, -0.6851806640625, -0.55804443359375, -0.430908203125, -0.30377197265625, -0.1766357421875, -0.04949951171875, 0.07763671875, 0.20477294921875, 0.3319091796875, 0.45904541015625, 0.586181640625, 0.71331787109375, 0.8404541015625, 0.96759033203125, 1.0947265625, 1.22186279296875, 1.3489990234375, 1.47613525390625, 1.603271484375, 1.73040771484375, 1.8575439453125, 1.98468017578125, 2.11181640625, 2.23895263671875, 2.3660888671875, 2.49322509765625, 2.620361328125, 2.74749755859375, 2.8746337890625, 3.00177001953125, 3.12890625]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 10.0, 15.0, 27.0, 49.0, 61.0, 72.0, 113.0, 111.0, 114.0, 104.0, 87.0, 84.0, 53.0, 36.0, 23.0, 14.0, 15.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.8818359375, -0.8624076843261719, -0.8429794311523438, -0.8235511779785156, -0.8041229248046875, -0.7846946716308594, -0.7652664184570312, -0.7458381652832031, -0.726409912109375, -0.7069816589355469, -0.6875534057617188, -0.6681251525878906, -0.6486968994140625, -0.6292686462402344, -0.6098403930664062, -0.5904121398925781, -0.57098388671875, -0.5515556335449219, -0.5321273803710938, -0.5126991271972656, -0.4932708740234375, -0.4738426208496094, -0.45441436767578125, -0.4349861145019531, -0.415557861328125, -0.3961296081542969, -0.37670135498046875, -0.3572731018066406, -0.3378448486328125, -0.3184165954589844, -0.29898834228515625, -0.2795600891113281, -0.2601318359375, -0.24070358276367188, -0.22127532958984375, -0.20184707641601562, -0.1824188232421875, -0.16299057006835938, -0.14356231689453125, -0.12413406372070312, -0.104705810546875, -0.08527755737304688, -0.06584930419921875, -0.046421051025390625, -0.0269927978515625, -0.007564544677734375, 0.01186370849609375, 0.031291961669921875, 0.05072021484375, 0.07014846801757812, 0.08957672119140625, 0.10900497436523438, 0.1284332275390625, 0.14786148071289062, 0.16728973388671875, 0.18671798706054688, 0.206146240234375, 0.22557449340820312, 0.24500274658203125, 0.2644309997558594, 0.2838592529296875, 0.3032875061035156, 0.32271575927734375, 0.3421440124511719, 0.361572265625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 8.0, 4.0, 13.0, 23.0, 16.0, 23.0, 50.0, 68.0, 96.0, 146.0, 222.0, 399.0, 696.0, 1197.0, 2569.0, 5824.0, 16353.0, 66914.0, 378571.0, 457903.0, 85113.0, 19763.0, 6561.0, 2817.0, 1336.0, 708.0, 427.0, 229.0, 165.0, 94.0, 71.0, 47.0, 18.0, 23.0, 15.0, 12.0, 8.0, 9.0, 6.0, 7.0, 2.0, 5.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0], "bins": [-2.0234375, -1.96405029296875, -1.9046630859375, -1.84527587890625, -1.785888671875, -1.72650146484375, -1.6671142578125, -1.60772705078125, -1.54833984375, -1.48895263671875, -1.4295654296875, -1.37017822265625, -1.310791015625, -1.25140380859375, -1.1920166015625, -1.13262939453125, -1.0732421875, -1.01385498046875, -0.9544677734375, -0.89508056640625, -0.835693359375, -0.77630615234375, -0.7169189453125, -0.65753173828125, -0.59814453125, -0.53875732421875, -0.4793701171875, -0.41998291015625, -0.360595703125, -0.30120849609375, -0.2418212890625, -0.18243408203125, -0.123046875, -0.06365966796875, -0.0042724609375, 0.05511474609375, 0.114501953125, 0.17388916015625, 0.2332763671875, 0.29266357421875, 0.35205078125, 0.41143798828125, 0.4708251953125, 0.53021240234375, 0.589599609375, 0.64898681640625, 0.7083740234375, 0.76776123046875, 0.8271484375, 0.88653564453125, 0.9459228515625, 1.00531005859375, 1.064697265625, 1.12408447265625, 1.1834716796875, 1.24285888671875, 1.30224609375, 1.36163330078125, 1.4210205078125, 1.48040771484375, 1.539794921875, 1.59918212890625, 1.6585693359375, 1.71795654296875, 1.77734375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 4.0, 4.0, 12.0, 15.0, 8.0, 25.0, 24.0, 44.0, 44.0, 48.0, 63.0, 62.0, 62.0, 67.0, 72.0, 72.0, 67.0, 60.0, 56.0, 42.0, 29.0, 34.0, 27.0, 15.0, 7.0, 9.0, 6.0, 1.0, 3.0, 0.0, 5.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.140625, -2.079345703125, -2.01806640625, -1.956787109375, -1.8955078125, -1.834228515625, -1.77294921875, -1.711669921875, -1.650390625, -1.589111328125, -1.52783203125, -1.466552734375, -1.4052734375, -1.343994140625, -1.28271484375, -1.221435546875, -1.16015625, -1.098876953125, -1.03759765625, -0.976318359375, -0.9150390625, -0.853759765625, -0.79248046875, -0.731201171875, -0.669921875, -0.608642578125, -0.54736328125, -0.486083984375, -0.4248046875, -0.363525390625, -0.30224609375, -0.240966796875, -0.1796875, -0.118408203125, -0.05712890625, 0.004150390625, 0.0654296875, 0.126708984375, 0.18798828125, 0.249267578125, 0.310546875, 0.371826171875, 0.43310546875, 0.494384765625, 0.5556640625, 0.616943359375, 0.67822265625, 0.739501953125, 0.80078125, 0.862060546875, 0.92333984375, 0.984619140625, 1.0458984375, 1.107177734375, 1.16845703125, 1.229736328125, 1.291015625, 1.352294921875, 1.41357421875, 1.474853515625, 1.5361328125, 1.597412109375, 1.65869140625, 1.719970703125, 1.78125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 5.0, 10.0, 9.0, 12.0, 13.0, 23.0, 27.0, 41.0, 75.0, 149.0, 245.0, 460.0, 967.0, 2252.0, 5983.0, 19926.0, 99874.0, 584676.0, 274431.0, 42256.0, 10455.0, 3641.0, 1524.0, 689.0, 319.0, 184.0, 118.0, 55.0, 55.0, 22.0, 12.0, 14.0, 8.0, 10.0, 2.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94970703125, -0.9223785400390625, -0.895050048828125, -0.8677215576171875, -0.84039306640625, -0.8130645751953125, -0.785736083984375, -0.7584075927734375, -0.7310791015625, -0.7037506103515625, -0.676422119140625, -0.6490936279296875, -0.62176513671875, -0.5944366455078125, -0.567108154296875, -0.5397796630859375, -0.512451171875, -0.4851226806640625, -0.457794189453125, -0.4304656982421875, -0.40313720703125, -0.3758087158203125, -0.348480224609375, -0.3211517333984375, -0.2938232421875, -0.2664947509765625, -0.239166259765625, -0.2118377685546875, -0.18450927734375, -0.1571807861328125, -0.129852294921875, -0.1025238037109375, -0.0751953125, -0.0478668212890625, -0.020538330078125, 0.0067901611328125, 0.03411865234375, 0.0614471435546875, 0.088775634765625, 0.1161041259765625, 0.1434326171875, 0.1707611083984375, 0.198089599609375, 0.2254180908203125, 0.25274658203125, 0.2800750732421875, 0.307403564453125, 0.3347320556640625, 0.362060546875, 0.3893890380859375, 0.416717529296875, 0.4440460205078125, 0.47137451171875, 0.4987030029296875, 0.526031494140625, 0.5533599853515625, 0.5806884765625, 0.6080169677734375, 0.635345458984375, 0.6626739501953125, 0.69000244140625, 0.7173309326171875, 0.744659423828125, 0.7719879150390625, 0.79931640625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 5.0, 6.0, 4.0, 11.0, 12.0, 19.0, 25.0, 39.0, 55.0, 88.0, 139.0, 160.0, 130.0, 100.0, 69.0, 37.0, 23.0, 24.0, 18.0, 13.0, 6.0, 5.0, 6.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00021910667419433594, -0.00021238625049591064, -0.00020566582679748535, -0.00019894540309906006, -0.00019222497940063477, -0.00018550455570220947, -0.00017878413200378418, -0.0001720637083053589, -0.0001653432846069336, -0.0001586228609085083, -0.000151902437210083, -0.00014518201351165771, -0.00013846158981323242, -0.00013174116611480713, -0.00012502074241638184, -0.00011830031871795654, -0.00011157989501953125, -0.00010485947132110596, -9.813904762268066e-05, -9.141862392425537e-05, -8.469820022583008e-05, -7.797777652740479e-05, -7.125735282897949e-05, -6.45369291305542e-05, -5.7816505432128906e-05, -5.109608173370361e-05, -4.437565803527832e-05, -3.765523433685303e-05, -3.0934810638427734e-05, -2.421438694000244e-05, -1.749396324157715e-05, -1.0773539543151855e-05, -4.0531158447265625e-06, 2.6673078536987305e-06, 9.387731552124023e-06, 1.6108155250549316e-05, 2.282857894897461e-05, 2.9549002647399902e-05, 3.6269426345825195e-05, 4.298985004425049e-05, 4.971027374267578e-05, 5.6430697441101074e-05, 6.315112113952637e-05, 6.987154483795166e-05, 7.659196853637695e-05, 8.331239223480225e-05, 9.003281593322754e-05, 9.675323963165283e-05, 0.00010347366333007812, 0.00011019408702850342, 0.00011691451072692871, 0.000123634934425354, 0.0001303553581237793, 0.0001370757818222046, 0.00014379620552062988, 0.00015051662921905518, 0.00015723705291748047, 0.00016395747661590576, 0.00017067790031433105, 0.00017739832401275635, 0.00018411874771118164, 0.00019083917140960693, 0.00019755959510803223, 0.00020428001880645752, 0.0002110004425048828]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 3.0, 9.0, 9.0, 20.0, 24.0, 32.0, 76.0, 148.0, 320.0, 835.0, 2884.0, 16505.0, 267738.0, 712725.0, 39845.0, 5273.0, 1225.0, 466.0, 191.0, 102.0, 47.0, 31.0, 21.0, 14.0, 7.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2802734375, -1.2294464111328125, -1.178619384765625, -1.1277923583984375, -1.07696533203125, -1.0261383056640625, -0.975311279296875, -0.9244842529296875, -0.8736572265625, -0.8228302001953125, -0.772003173828125, -0.7211761474609375, -0.67034912109375, -0.6195220947265625, -0.568695068359375, -0.5178680419921875, -0.467041015625, -0.4162139892578125, -0.365386962890625, -0.3145599365234375, -0.26373291015625, -0.2129058837890625, -0.162078857421875, -0.1112518310546875, -0.0604248046875, -0.0095977783203125, 0.041229248046875, 0.0920562744140625, 0.14288330078125, 0.1937103271484375, 0.244537353515625, 0.2953643798828125, 0.34619140625, 0.3970184326171875, 0.447845458984375, 0.4986724853515625, 0.54949951171875, 0.6003265380859375, 0.651153564453125, 0.7019805908203125, 0.7528076171875, 0.8036346435546875, 0.854461669921875, 0.9052886962890625, 0.95611572265625, 1.0069427490234375, 1.057769775390625, 1.1085968017578125, 1.159423828125, 1.2102508544921875, 1.261077880859375, 1.3119049072265625, 1.36273193359375, 1.4135589599609375, 1.464385986328125, 1.5152130126953125, 1.5660400390625, 1.6168670654296875, 1.667694091796875, 1.7185211181640625, 1.76934814453125, 1.8201751708984375, 1.871002197265625, 1.9218292236328125, 1.97265625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 6.0, 8.0, 11.0, 22.0, 14.0, 33.0, 49.0, 55.0, 70.0, 88.0, 97.0, 92.0, 105.0, 67.0, 80.0, 53.0, 38.0, 27.0, 21.0, 11.0, 11.0, 10.0, 10.0, 6.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5126953125, -0.4925079345703125, -0.472320556640625, -0.4521331787109375, -0.43194580078125, -0.4117584228515625, -0.391571044921875, -0.3713836669921875, -0.3511962890625, -0.3310089111328125, -0.310821533203125, -0.2906341552734375, -0.27044677734375, -0.2502593994140625, -0.230072021484375, -0.2098846435546875, -0.189697265625, -0.1695098876953125, -0.149322509765625, -0.1291351318359375, -0.10894775390625, -0.0887603759765625, -0.068572998046875, -0.0483856201171875, -0.0281982421875, -0.0080108642578125, 0.012176513671875, 0.0323638916015625, 0.05255126953125, 0.0727386474609375, 0.092926025390625, 0.1131134033203125, 0.13330078125, 0.1534881591796875, 0.173675537109375, 0.1938629150390625, 0.21405029296875, 0.2342376708984375, 0.254425048828125, 0.2746124267578125, 0.2947998046875, 0.3149871826171875, 0.335174560546875, 0.3553619384765625, 0.37554931640625, 0.3957366943359375, 0.415924072265625, 0.4361114501953125, 0.456298828125, 0.4764862060546875, 0.496673583984375, 0.5168609619140625, 0.53704833984375, 0.5572357177734375, 0.577423095703125, 0.5976104736328125, 0.6177978515625, 0.6379852294921875, 0.658172607421875, 0.6783599853515625, 0.69854736328125, 0.7187347412109375, 0.738922119140625, 0.7591094970703125, 0.779296875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 9.0, 12.0, 21.0, 39.0, 82.0, 185.0, 245.0, 219.0, 96.0, 45.0, 23.0, 15.0, 5.0, 4.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.381412506103516, -26.767169952392578, -26.15292739868164, -25.538684844970703, -24.924442291259766, -24.310199737548828, -23.69595718383789, -23.081716537475586, -22.46747398376465, -21.85323143005371, -21.238988876342773, -20.624746322631836, -20.0105037689209, -19.396263122558594, -18.782020568847656, -18.16777801513672, -17.55353546142578, -16.939292907714844, -16.325050354003906, -15.710807800292969, -15.096566200256348, -14.48232364654541, -13.868081092834473, -13.253839492797852, -12.639595031738281, -12.025352478027344, -11.411109924316406, -10.796867370605469, -10.182625770568848, -9.56838321685791, -8.954140663146973, -8.339899063110352, -7.7256574630737305, -7.111414909362793, -6.497172832489014, -5.882930278778076, -5.268688201904297, -4.654445648193359, -4.040203094482422, -3.4259610176086426, -2.811718463897705, -2.1974761486053467, -1.5832337141036987, -0.9689912796020508, -0.3547489643096924, 0.259493350982666, 0.8737359046936035, 1.4879779815673828, 2.1022205352783203, 2.7164628505706787, 3.330705165863037, 3.9449477195739746, 4.559189796447754, 5.173432350158691, 5.787674903869629, 6.401916980743408, 7.016159534454346, 7.630402088165283, 8.244644165039062, 8.85888671875, 9.473129272460938, 10.087371826171875, 10.701614379882812, 11.315855979919434, 11.930098533630371]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 6.0, 4.0, 3.0, 4.0, 5.0, 6.0, 17.0, 15.0, 14.0, 19.0, 19.0, 24.0, 31.0, 36.0, 37.0, 44.0, 52.0, 43.0, 46.0, 53.0, 70.0, 49.0, 53.0, 50.0, 39.0, 36.0, 42.0, 33.0, 27.0, 18.0, 22.0, 16.0, 10.0, 15.0, 15.0, 4.0, 6.0, 6.0, 4.0, 2.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-11.464635848999023, -11.16545295715332, -10.866271018981934, -10.567089080810547, -10.267906188964844, -9.96872329711914, -9.669541358947754, -9.370359420776367, -9.071176528930664, -8.771993637084961, -8.472811698913574, -8.173629760742188, -7.874446868896484, -7.5752644538879395, -7.2760820388793945, -6.97689962387085, -6.677717208862305, -6.37853479385376, -6.079352378845215, -5.78016996383667, -5.480987548828125, -5.18180513381958, -4.882622718811035, -4.58344030380249, -4.284257888793945, -3.9850754737854004, -3.6858930587768555, -3.3867106437683105, -3.0875282287597656, -2.7883458137512207, -2.489163398742676, -2.189980983734131, -1.8907976150512695, -1.5916152000427246, -1.2924327850341797, -0.9932503700256348, -0.6940679550170898, -0.3948855400085449, -0.095703125, 0.20347929000854492, 0.5026617050170898, 0.8018441200256348, 1.1010265350341797, 1.4002089500427246, 1.6993913650512695, 1.9985737800598145, 2.2977561950683594, 2.5969386100769043, 2.896121025085449, 3.195303440093994, 3.494485855102539, 3.793668270111084, 4.092850685119629, 4.392033100128174, 4.691215515136719, 4.990397930145264, 5.289580345153809, 5.5887627601623535, 5.887945175170898, 6.187127590179443, 6.486310005187988, 6.785492420196533, 7.084674835205078, 7.383857250213623, 7.683039665222168]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 11.0, 6.0, 7.0, 18.0, 17.0, 16.0, 27.0, 41.0, 50.0, 71.0, 93.0, 115.0, 201.0, 291.0, 503.0, 985.0, 2153.0, 6439.0, 28275.0, 266102.0, 3792279.0, 77106.0, 13230.0, 3617.0, 1327.0, 623.0, 317.0, 128.0, 82.0, 55.0, 45.0, 19.0, 10.0, 11.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.734375, -4.627410888671875, -4.52044677734375, -4.413482666015625, -4.3065185546875, -4.199554443359375, -4.09259033203125, -3.985626220703125, -3.878662109375, -3.771697998046875, -3.66473388671875, -3.557769775390625, -3.4508056640625, -3.343841552734375, -3.23687744140625, -3.129913330078125, -3.02294921875, -2.915985107421875, -2.80902099609375, -2.702056884765625, -2.5950927734375, -2.488128662109375, -2.38116455078125, -2.274200439453125, -2.167236328125, -2.060272216796875, -1.95330810546875, -1.846343994140625, -1.7393798828125, -1.632415771484375, -1.52545166015625, -1.418487548828125, -1.3115234375, -1.204559326171875, -1.09759521484375, -0.990631103515625, -0.8836669921875, -0.776702880859375, -0.66973876953125, -0.562774658203125, -0.455810546875, -0.348846435546875, -0.24188232421875, -0.134918212890625, -0.0279541015625, 0.079010009765625, 0.18597412109375, 0.292938232421875, 0.39990234375, 0.506866455078125, 0.61383056640625, 0.720794677734375, 0.8277587890625, 0.934722900390625, 1.04168701171875, 1.148651123046875, 1.255615234375, 1.362579345703125, 1.46954345703125, 1.576507568359375, 1.6834716796875, 1.790435791015625, 1.89739990234375, 2.004364013671875, 2.111328125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 3.0, 2.0, 4.0, 12.0, 25.0, 24.0, 43.0, 67.0, 70.0, 82.0, 105.0, 105.0, 119.0, 82.0, 67.0, 68.0, 47.0, 31.0, 16.0, 19.0, 5.0, 6.0, 1.0, 2.0, 2.0, 1.0, 4.0], "bins": [-0.939453125, -0.9200859069824219, -0.9007186889648438, -0.8813514709472656, -0.8619842529296875, -0.8426170349121094, -0.8232498168945312, -0.8038825988769531, -0.784515380859375, -0.7651481628417969, -0.7457809448242188, -0.7264137268066406, -0.7070465087890625, -0.6876792907714844, -0.6683120727539062, -0.6489448547363281, -0.62957763671875, -0.6102104187011719, -0.5908432006835938, -0.5714759826660156, -0.5521087646484375, -0.5327415466308594, -0.5133743286132812, -0.4940071105957031, -0.474639892578125, -0.4552726745605469, -0.43590545654296875, -0.4165382385253906, -0.3971710205078125, -0.3778038024902344, -0.35843658447265625, -0.3390693664550781, -0.3197021484375, -0.3003349304199219, -0.28096771240234375, -0.2616004943847656, -0.2422332763671875, -0.22286605834960938, -0.20349884033203125, -0.18413162231445312, -0.164764404296875, -0.14539718627929688, -0.12602996826171875, -0.10666275024414062, -0.0872955322265625, -0.06792831420898438, -0.04856109619140625, -0.029193878173828125, -0.00982666015625, 0.009540557861328125, 0.02890777587890625, 0.048274993896484375, 0.0676422119140625, 0.08700942993164062, 0.10637664794921875, 0.12574386596679688, 0.145111083984375, 0.16447830200195312, 0.18384552001953125, 0.20321273803710938, 0.2225799560546875, 0.24194717407226562, 0.26131439208984375, 0.2806816101074219, 0.300048828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 9.0, 20.0, 61.0, 121.0, 321.0, 1232.0, 36929.0, 4151503.0, 3259.0, 487.0, 179.0, 86.0, 40.0, 22.0, 7.0, 7.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.7578125, -11.1463623046875, -10.534912109375, -9.9234619140625, -9.31201171875, -8.7005615234375, -8.089111328125, -7.4776611328125, -6.8662109375, -6.2547607421875, -5.643310546875, -5.0318603515625, -4.42041015625, -3.8089599609375, -3.197509765625, -2.5860595703125, -1.974609375, -1.3631591796875, -0.751708984375, -0.1402587890625, 0.47119140625, 1.0826416015625, 1.694091796875, 2.3055419921875, 2.9169921875, 3.5284423828125, 4.139892578125, 4.7513427734375, 5.36279296875, 5.9742431640625, 6.585693359375, 7.1971435546875, 7.80859375, 8.4200439453125, 9.031494140625, 9.6429443359375, 10.25439453125, 10.8658447265625, 11.477294921875, 12.0887451171875, 12.7001953125, 13.3116455078125, 13.923095703125, 14.5345458984375, 15.14599609375, 15.7574462890625, 16.368896484375, 16.9803466796875, 17.591796875, 18.2032470703125, 18.814697265625, 19.4261474609375, 20.03759765625, 20.6490478515625, 21.260498046875, 21.8719482421875, 22.4833984375, 23.0948486328125, 23.706298828125, 24.3177490234375, 24.92919921875, 25.5406494140625, 26.152099609375, 26.7635498046875, 27.375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 12.0, 9.0, 31.0, 124.0, 851.0, 2826.0, 166.0, 37.0, 13.0, 8.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.25390625, -2.1473388671875, -2.040771484375, -1.9342041015625, -1.82763671875, -1.7210693359375, -1.614501953125, -1.5079345703125, -1.4013671875, -1.2947998046875, -1.188232421875, -1.0816650390625, -0.97509765625, -0.8685302734375, -0.761962890625, -0.6553955078125, -0.548828125, -0.4422607421875, -0.335693359375, -0.2291259765625, -0.12255859375, -0.0159912109375, 0.090576171875, 0.1971435546875, 0.3037109375, 0.4102783203125, 0.516845703125, 0.6234130859375, 0.72998046875, 0.8365478515625, 0.943115234375, 1.0496826171875, 1.15625, 1.2628173828125, 1.369384765625, 1.4759521484375, 1.58251953125, 1.6890869140625, 1.795654296875, 1.9022216796875, 2.0087890625, 2.1153564453125, 2.221923828125, 2.3284912109375, 2.43505859375, 2.5416259765625, 2.648193359375, 2.7547607421875, 2.861328125, 2.9678955078125, 3.074462890625, 3.1810302734375, 3.28759765625, 3.3941650390625, 3.500732421875, 3.6072998046875, 3.7138671875, 3.8204345703125, 3.927001953125, 4.0335693359375, 4.14013671875, 4.2467041015625, 4.353271484375, 4.4598388671875, 4.56640625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 5.0, 7.0, 12.0, 18.0, 55.0, 151.0, 296.0, 281.0, 107.0, 37.0, 20.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.575599670410156, -19.13873291015625, -18.701866149902344, -18.264999389648438, -17.828134536743164, -17.391267776489258, -16.95440101623535, -16.517534255981445, -16.08066749572754, -15.643800735473633, -15.206934928894043, -14.770068168640137, -14.33320140838623, -13.89633560180664, -13.459468841552734, -13.022602081298828, -12.585735321044922, -12.148868560791016, -11.712002754211426, -11.27513599395752, -10.838269233703613, -10.401403427124023, -9.964536666870117, -9.527669906616211, -9.090804100036621, -8.653937339782715, -8.217071533203125, -7.780204772949219, -7.3433380126953125, -6.9064717292785645, -6.469605445861816, -6.03273868560791, -5.595871925354004, -5.159005641937256, -4.72213888168335, -4.285272598266602, -3.8484058380126953, -3.4115395545959473, -2.97467303276062, -2.537806510925293, -2.100939989089966, -1.6640734672546387, -1.2272069454193115, -0.7903405427932739, -0.3534740209579468, 0.08339238166809082, 0.520258903503418, 0.9571254253387451, 1.3939919471740723, 1.8308584690093994, 2.2677249908447266, 2.7045912742614746, 3.141458034515381, 3.578324317932129, 4.015191078186035, 4.452057361602783, 4.888923645019531, 5.325789928436279, 5.7626566886901855, 6.199522972106934, 6.63638973236084, 7.073256015777588, 7.510122299194336, 7.946989059448242, 8.383855819702148]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 8.0, 7.0, 13.0, 17.0, 33.0, 55.0, 50.0, 70.0, 86.0, 102.0, 101.0, 87.0, 96.0, 80.0, 60.0, 53.0, 29.0, 24.0, 14.0, 8.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.491847991943359, -6.2750935554504395, -6.0583391189575195, -5.8415846824646, -5.62483024597168, -5.40807580947876, -5.19132137298584, -4.974567413330078, -4.7578125, -4.54105806350708, -4.32430362701416, -4.10754919052124, -3.8907947540283203, -3.6740403175354004, -3.4572861194610596, -3.2405316829681396, -3.023777484893799, -2.807023048400879, -2.590268611907959, -2.373514175415039, -2.156759738922119, -1.9400054216384888, -1.7232511043548584, -1.5064966678619385, -1.2897422313690186, -1.0729877948760986, -0.8562334179878235, -0.6394790410995483, -0.4227246046066284, -0.2059701681137085, 0.010784149169921875, 0.2275385856628418, 0.4442930221557617, 0.6610474586486816, 0.8778018355369568, 1.094556212425232, 1.3113106489181519, 1.5280650854110718, 1.7448194026947021, 1.961573839187622, 2.178328275680542, 2.395082712173462, 2.611837148666382, 2.8285913467407227, 3.0453457832336426, 3.2621002197265625, 3.4788546562194824, 3.6956090927124023, 3.9123635292053223, 4.129117965698242, 4.345872402191162, 4.562626838684082, 4.779381275177002, 4.996135711669922, 5.212889671325684, 5.429644584655762, 5.646398544311523, 5.863152980804443, 6.079907417297363, 6.296661853790283, 6.513416290283203, 6.730170726776123, 6.946925163269043, 7.163679122924805, 7.380434036254883]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 2.0, 5.0, 7.0, 6.0, 6.0, 7.0, 21.0, 21.0, 28.0, 31.0, 39.0, 56.0, 66.0, 89.0, 125.0, 167.0, 229.0, 370.0, 558.0, 945.0, 2059.0, 5024.0, 17804.0, 83375.0, 422726.0, 408494.0, 79628.0, 17084.0, 4887.0, 1925.0, 1001.0, 542.0, 333.0, 213.0, 173.0, 130.0, 82.0, 60.0, 60.0, 40.0, 36.0, 29.0, 17.0, 12.0, 16.0, 7.0, 8.0, 4.0, 5.0, 5.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.103515625, -2.03094482421875, -1.9583740234375, -1.88580322265625, -1.813232421875, -1.74066162109375, -1.6680908203125, -1.59552001953125, -1.52294921875, -1.45037841796875, -1.3778076171875, -1.30523681640625, -1.232666015625, -1.16009521484375, -1.0875244140625, -1.01495361328125, -0.9423828125, -0.86981201171875, -0.7972412109375, -0.72467041015625, -0.652099609375, -0.57952880859375, -0.5069580078125, -0.43438720703125, -0.36181640625, -0.28924560546875, -0.2166748046875, -0.14410400390625, -0.071533203125, 0.00103759765625, 0.0736083984375, 0.14617919921875, 0.21875, 0.29132080078125, 0.3638916015625, 0.43646240234375, 0.509033203125, 0.58160400390625, 0.6541748046875, 0.72674560546875, 0.79931640625, 0.87188720703125, 0.9444580078125, 1.01702880859375, 1.089599609375, 1.16217041015625, 1.2347412109375, 1.30731201171875, 1.3798828125, 1.45245361328125, 1.5250244140625, 1.59759521484375, 1.670166015625, 1.74273681640625, 1.8153076171875, 1.88787841796875, 1.96044921875, 2.03302001953125, 2.1055908203125, 2.17816162109375, 2.250732421875, 2.32330322265625, 2.3958740234375, 2.46844482421875, 2.541015625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 8.0, 19.0, 35.0, 46.0, 72.0, 88.0, 108.0, 141.0, 132.0, 104.0, 84.0, 63.0, 46.0, 23.0, 15.0, 5.0, 9.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7958984375, -0.7700424194335938, -0.7441864013671875, -0.7183303833007812, -0.692474365234375, -0.6666183471679688, -0.6407623291015625, -0.6149063110351562, -0.58905029296875, -0.5631942749023438, -0.5373382568359375, -0.5114822387695312, -0.485626220703125, -0.45977020263671875, -0.4339141845703125, -0.40805816650390625, -0.3822021484375, -0.35634613037109375, -0.3304901123046875, -0.30463409423828125, -0.278778076171875, -0.25292205810546875, -0.2270660400390625, -0.20121002197265625, -0.17535400390625, -0.14949798583984375, -0.1236419677734375, -0.09778594970703125, -0.071929931640625, -0.04607391357421875, -0.0202178955078125, 0.00563812255859375, 0.031494140625, 0.05735015869140625, 0.0832061767578125, 0.10906219482421875, 0.134918212890625, 0.16077423095703125, 0.1866302490234375, 0.21248626708984375, 0.23834228515625, 0.26419830322265625, 0.2900543212890625, 0.31591033935546875, 0.341766357421875, 0.36762237548828125, 0.3934783935546875, 0.41933441162109375, 0.4451904296875, 0.47104644775390625, 0.4969024658203125, 0.5227584838867188, 0.548614501953125, 0.5744705200195312, 0.6003265380859375, 0.6261825561523438, 0.65203857421875, 0.6778945922851562, 0.7037506103515625, 0.7296066284179688, 0.755462646484375, 0.7813186645507812, 0.8071746826171875, 0.8330307006835938, 0.85888671875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 7.0, 8.0, 10.0, 14.0, 32.0, 31.0, 55.0, 90.0, 144.0, 208.0, 408.0, 755.0, 1577.0, 3647.0, 8377.0, 22685.0, 68040.0, 210164.0, 397958.0, 221776.0, 72529.0, 23957.0, 8842.0, 3693.0, 1685.0, 806.0, 407.0, 228.0, 139.0, 72.0, 58.0, 44.0, 35.0, 20.0, 7.0, 14.0, 10.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1708984375, -1.133758544921875, -1.09661865234375, -1.059478759765625, -1.0223388671875, -0.985198974609375, -0.94805908203125, -0.910919189453125, -0.873779296875, -0.836639404296875, -0.79949951171875, -0.762359619140625, -0.7252197265625, -0.688079833984375, -0.65093994140625, -0.613800048828125, -0.57666015625, -0.539520263671875, -0.50238037109375, -0.465240478515625, -0.4281005859375, -0.390960693359375, -0.35382080078125, -0.316680908203125, -0.279541015625, -0.242401123046875, -0.20526123046875, -0.168121337890625, -0.1309814453125, -0.093841552734375, -0.05670166015625, -0.019561767578125, 0.017578125, 0.054718017578125, 0.09185791015625, 0.128997802734375, 0.1661376953125, 0.203277587890625, 0.24041748046875, 0.277557373046875, 0.314697265625, 0.351837158203125, 0.38897705078125, 0.426116943359375, 0.4632568359375, 0.500396728515625, 0.53753662109375, 0.574676513671875, 0.61181640625, 0.648956298828125, 0.68609619140625, 0.723236083984375, 0.7603759765625, 0.797515869140625, 0.83465576171875, 0.871795654296875, 0.908935546875, 0.946075439453125, 0.98321533203125, 1.020355224609375, 1.0574951171875, 1.094635009765625, 1.13177490234375, 1.168914794921875, 1.2060546875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 7.0, 0.0, 1.0, 4.0, 3.0, 2.0, 7.0, 12.0, 4.0, 9.0, 17.0, 19.0, 15.0, 25.0, 24.0, 35.0, 28.0, 30.0, 48.0, 36.0, 53.0, 44.0, 52.0, 38.0, 43.0, 47.0, 44.0, 33.0, 34.0, 46.0, 45.0, 38.0, 20.0, 23.0, 24.0, 17.0, 14.0, 12.0, 16.0, 10.0, 9.0, 7.0, 8.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2587890625, -1.2192535400390625, -1.179718017578125, -1.1401824951171875, -1.10064697265625, -1.0611114501953125, -1.021575927734375, -0.9820404052734375, -0.9425048828125, -0.9029693603515625, -0.863433837890625, -0.8238983154296875, -0.78436279296875, -0.7448272705078125, -0.705291748046875, -0.6657562255859375, -0.626220703125, -0.5866851806640625, -0.547149658203125, -0.5076141357421875, -0.46807861328125, -0.4285430908203125, -0.389007568359375, -0.3494720458984375, -0.3099365234375, -0.2704010009765625, -0.230865478515625, -0.1913299560546875, -0.15179443359375, -0.1122589111328125, -0.072723388671875, -0.0331878662109375, 0.00634765625, 0.0458831787109375, 0.085418701171875, 0.1249542236328125, 0.16448974609375, 0.2040252685546875, 0.243560791015625, 0.2830963134765625, 0.3226318359375, 0.3621673583984375, 0.401702880859375, 0.4412384033203125, 0.48077392578125, 0.5203094482421875, 0.559844970703125, 0.5993804931640625, 0.638916015625, 0.6784515380859375, 0.717987060546875, 0.7575225830078125, 0.79705810546875, 0.8365936279296875, 0.876129150390625, 0.9156646728515625, 0.9552001953125, 0.9947357177734375, 1.034271240234375, 1.0738067626953125, 1.11334228515625, 1.1528778076171875, 1.192413330078125, 1.2319488525390625, 1.271484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 4.0, 10.0, 9.0, 22.0, 27.0, 35.0, 76.0, 153.0, 297.0, 722.0, 2305.0, 9008.0, 59966.0, 552111.0, 377083.0, 37448.0, 6377.0, 1731.0, 619.0, 267.0, 116.0, 66.0, 35.0, 22.0, 15.0, 13.0, 4.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3916015625, -1.3558197021484375, -1.320037841796875, -1.2842559814453125, -1.24847412109375, -1.2126922607421875, -1.176910400390625, -1.1411285400390625, -1.1053466796875, -1.0695648193359375, -1.033782958984375, -0.9980010986328125, -0.96221923828125, -0.9264373779296875, -0.890655517578125, -0.8548736572265625, -0.819091796875, -0.7833099365234375, -0.747528076171875, -0.7117462158203125, -0.67596435546875, -0.6401824951171875, -0.604400634765625, -0.5686187744140625, -0.5328369140625, -0.4970550537109375, -0.461273193359375, -0.4254913330078125, -0.38970947265625, -0.3539276123046875, -0.318145751953125, -0.2823638916015625, -0.24658203125, -0.2108001708984375, -0.175018310546875, -0.1392364501953125, -0.10345458984375, -0.0676727294921875, -0.031890869140625, 0.0038909912109375, 0.0396728515625, 0.0754547119140625, 0.111236572265625, 0.1470184326171875, 0.18280029296875, 0.2185821533203125, 0.254364013671875, 0.2901458740234375, 0.325927734375, 0.3617095947265625, 0.397491455078125, 0.4332733154296875, 0.46905517578125, 0.5048370361328125, 0.540618896484375, 0.5764007568359375, 0.6121826171875, 0.6479644775390625, 0.683746337890625, 0.7195281982421875, 0.75531005859375, 0.7910919189453125, 0.826873779296875, 0.8626556396484375, 0.8984375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 1.0, 2.0, 7.0, 6.0, 13.0, 14.0, 13.0, 31.0, 29.0, 39.0, 47.0, 80.0, 77.0, 94.0, 96.0, 84.0, 89.0, 61.0, 43.0, 31.0, 31.0, 23.0, 13.0, 25.0, 17.0, 9.0, 8.0, 6.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001380443572998047, -0.00013352185487747192, -0.00012899935245513916, -0.0001244768500328064, -0.00011995434761047363, -0.00011543184518814087, -0.0001109093427658081, -0.00010638684034347534, -0.00010186433792114258, -9.734183549880981e-05, -9.281933307647705e-05, -8.829683065414429e-05, -8.377432823181152e-05, -7.925182580947876e-05, -7.4729323387146e-05, -7.020682096481323e-05, -6.568431854248047e-05, -6.11618161201477e-05, -5.663931369781494e-05, -5.211681127548218e-05, -4.7594308853149414e-05, -4.307180643081665e-05, -3.854930400848389e-05, -3.402680158615112e-05, -2.950429916381836e-05, -2.4981796741485596e-05, -2.0459294319152832e-05, -1.593679189682007e-05, -1.1414289474487305e-05, -6.891787052154541e-06, -2.3692846298217773e-06, 2.1532177925109863e-06, 6.67572021484375e-06, 1.1198222637176514e-05, 1.5720725059509277e-05, 2.024322748184204e-05, 2.4765729904174805e-05, 2.928823232650757e-05, 3.381073474884033e-05, 3.8333237171173096e-05, 4.285573959350586e-05, 4.737824201583862e-05, 5.190074443817139e-05, 5.642324686050415e-05, 6.0945749282836914e-05, 6.546825170516968e-05, 6.999075412750244e-05, 7.45132565498352e-05, 7.903575897216797e-05, 8.355826139450073e-05, 8.80807638168335e-05, 9.260326623916626e-05, 9.712576866149902e-05, 0.00010164827108383179, 0.00010617077350616455, 0.00011069327592849731, 0.00011521577835083008, 0.00011973828077316284, 0.0001242607831954956, 0.00012878328561782837, 0.00013330578804016113, 0.0001378282904624939, 0.00014235079288482666, 0.00014687329530715942, 0.0001513957977294922]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 9.0, 1.0, 15.0, 10.0, 12.0, 26.0, 20.0, 61.0, 79.0, 113.0, 198.0, 364.0, 745.0, 1612.0, 3918.0, 11558.0, 44907.0, 246908.0, 564718.0, 132976.0, 27175.0, 7768.0, 2770.0, 1234.0, 607.0, 312.0, 173.0, 91.0, 46.0, 47.0, 22.0, 16.0, 16.0, 6.0, 5.0, 7.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.91943359375, -0.8909912109375, -0.862548828125, -0.8341064453125, -0.8056640625, -0.7772216796875, -0.748779296875, -0.7203369140625, -0.69189453125, -0.6634521484375, -0.635009765625, -0.6065673828125, -0.578125, -0.5496826171875, -0.521240234375, -0.4927978515625, -0.46435546875, -0.4359130859375, -0.407470703125, -0.3790283203125, -0.3505859375, -0.3221435546875, -0.293701171875, -0.2652587890625, -0.23681640625, -0.2083740234375, -0.179931640625, -0.1514892578125, -0.123046875, -0.0946044921875, -0.066162109375, -0.0377197265625, -0.00927734375, 0.0191650390625, 0.047607421875, 0.0760498046875, 0.1044921875, 0.1329345703125, 0.161376953125, 0.1898193359375, 0.21826171875, 0.2467041015625, 0.275146484375, 0.3035888671875, 0.33203125, 0.3604736328125, 0.388916015625, 0.4173583984375, 0.44580078125, 0.4742431640625, 0.502685546875, 0.5311279296875, 0.5595703125, 0.5880126953125, 0.616455078125, 0.6448974609375, 0.67333984375, 0.7017822265625, 0.730224609375, 0.7586669921875, 0.787109375, 0.8155517578125, 0.843994140625, 0.8724365234375, 0.90087890625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 5.0, 4.0, 11.0, 6.0, 13.0, 16.0, 26.0, 25.0, 40.0, 47.0, 48.0, 85.0, 73.0, 120.0, 69.0, 84.0, 79.0, 57.0, 37.0, 24.0, 40.0, 22.0, 13.0, 11.0, 13.0, 3.0, 8.0, 4.0, 1.0, 10.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53662109375, -0.5174484252929688, -0.4982757568359375, -0.47910308837890625, -0.459930419921875, -0.44075775146484375, -0.4215850830078125, -0.40241241455078125, -0.38323974609375, -0.36406707763671875, -0.3448944091796875, -0.32572174072265625, -0.306549072265625, -0.28737640380859375, -0.2682037353515625, -0.24903106689453125, -0.2298583984375, -0.21068572998046875, -0.1915130615234375, -0.17234039306640625, -0.153167724609375, -0.13399505615234375, -0.1148223876953125, -0.09564971923828125, -0.07647705078125, -0.05730438232421875, -0.0381317138671875, -0.01895904541015625, 0.000213623046875, 0.01938629150390625, 0.0385589599609375, 0.05773162841796875, 0.076904296875, 0.09607696533203125, 0.1152496337890625, 0.13442230224609375, 0.153594970703125, 0.17276763916015625, 0.1919403076171875, 0.21111297607421875, 0.23028564453125, 0.24945831298828125, 0.2686309814453125, 0.28780364990234375, 0.306976318359375, 0.32614898681640625, 0.3453216552734375, 0.36449432373046875, 0.3836669921875, 0.40283966064453125, 0.4220123291015625, 0.44118499755859375, 0.460357666015625, 0.47953033447265625, 0.4987030029296875, 0.5178756713867188, 0.53704833984375, 0.5562210083007812, 0.5753936767578125, 0.5945663452148438, 0.613739013671875, 0.6329116821289062, 0.6520843505859375, 0.6712570190429688, 0.6904296875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 6.0, 8.0, 79.0, 183.0, 340.0, 244.0, 95.0, 31.0, 7.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.347625732421875, -32.631187438964844, -31.914751052856445, -31.198312759399414, -30.481874465942383, -29.765438079833984, -29.048999786376953, -28.332561492919922, -27.61612319946289, -26.89968490600586, -26.18324851989746, -25.46681022644043, -24.7503719329834, -24.033935546875, -23.31749725341797, -22.601058959960938, -21.88462257385254, -21.168184280395508, -20.45174789428711, -19.735309600830078, -19.018871307373047, -18.302433013916016, -17.585996627807617, -16.869558334350586, -16.153121948242188, -15.436684608459473, -14.720246315002441, -14.003808975219727, -13.287370681762695, -12.57093334197998, -11.854496002197266, -11.138057708740234, -10.421618461608887, -9.705181121826172, -8.98874282836914, -8.272305488586426, -7.555867671966553, -6.83942985534668, -6.122992515563965, -5.406554698944092, -4.690116882324219, -3.9736790657043457, -3.2572414875030518, -2.540803909301758, -1.8243660926818848, -1.1079282760620117, -0.3914909362792969, 0.32494688034057617, 1.0413846969604492, 1.7578223943710327, 2.474260091781616, 3.19069766998291, 3.907135486602783, 4.623573303222656, 5.340010643005371, 6.056448459625244, 6.772886276245117, 7.48932409286499, 8.205761909484863, 8.922199249267578, 9.63863754272461, 10.355074882507324, 11.071512222290039, 11.78795051574707, 12.504387855529785]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 11.0, 5.0, 7.0, 10.0, 13.0, 9.0, 17.0, 24.0, 36.0, 22.0, 44.0, 48.0, 39.0, 53.0, 46.0, 50.0, 63.0, 62.0, 49.0, 50.0, 52.0, 47.0, 37.0, 36.0, 33.0, 22.0, 26.0, 20.0, 20.0, 17.0, 12.0, 8.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.689992427825928, -7.420827865600586, -7.151663780212402, -6.882499694824219, -6.613335132598877, -6.344170570373535, -6.075006484985352, -5.805842399597168, -5.536677837371826, -5.267513275146484, -4.998349189758301, -4.729185104370117, -4.460020542144775, -4.190855979919434, -3.92169189453125, -3.6525275707244873, -3.3833632469177246, -3.114198923110962, -2.845034599304199, -2.5758702754974365, -2.306705951690674, -2.037541627883911, -1.7683773040771484, -1.4992129802703857, -1.230048656463623, -0.9608843326568604, -0.6917200088500977, -0.42255568504333496, -0.15339136123657227, 0.11577296257019043, 0.3849372863769531, 0.6541016101837158, 0.9232654571533203, 1.192429780960083, 1.4615941047668457, 1.7307584285736084, 1.999922752380371, 2.269087076187134, 2.5382513999938965, 2.807415723800659, 3.076580047607422, 3.3457443714141846, 3.6149086952209473, 3.88407301902771, 4.153237342834473, 4.422401428222656, 4.691565990447998, 4.96073055267334, 5.229894638061523, 5.499058723449707, 5.768223285675049, 6.037387847900391, 6.306551933288574, 6.575716018676758, 6.8448805809021, 7.114045143127441, 7.383209228515625, 7.652373313903809, 7.92153787612915, 8.190702438354492, 8.459866523742676, 8.72903060913086, 8.99819564819336, 9.267359733581543, 9.536523818969727]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 10.0, 10.0, 4.0, 12.0, 8.0, 26.0, 23.0, 31.0, 40.0, 47.0, 72.0, 131.0, 194.0, 362.0, 810.0, 2528.0, 10556.0, 112621.0, 4021980.0, 36299.0, 5804.0, 1541.0, 549.0, 261.0, 133.0, 69.0, 49.0, 33.0, 24.0, 13.0, 11.0, 10.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.921875, -3.7833251953125, -3.644775390625, -3.5062255859375, -3.36767578125, -3.2291259765625, -3.090576171875, -2.9520263671875, -2.8134765625, -2.6749267578125, -2.536376953125, -2.3978271484375, -2.25927734375, -2.1207275390625, -1.982177734375, -1.8436279296875, -1.705078125, -1.5665283203125, -1.427978515625, -1.2894287109375, -1.15087890625, -1.0123291015625, -0.873779296875, -0.7352294921875, -0.5966796875, -0.4581298828125, -0.319580078125, -0.1810302734375, -0.04248046875, 0.0960693359375, 0.234619140625, 0.3731689453125, 0.51171875, 0.6502685546875, 0.788818359375, 0.9273681640625, 1.06591796875, 1.2044677734375, 1.343017578125, 1.4815673828125, 1.6201171875, 1.7586669921875, 1.897216796875, 2.0357666015625, 2.17431640625, 2.3128662109375, 2.451416015625, 2.5899658203125, 2.728515625, 2.8670654296875, 3.005615234375, 3.1441650390625, 3.28271484375, 3.4212646484375, 3.559814453125, 3.6983642578125, 3.8369140625, 3.9754638671875, 4.114013671875, 4.2525634765625, 4.39111328125, 4.5296630859375, 4.668212890625, 4.8067626953125, 4.9453125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 8.0, 19.0, 48.0, 56.0, 51.0, 86.0, 95.0, 113.0, 101.0, 107.0, 87.0, 85.0, 56.0, 24.0, 27.0, 12.0, 10.0, 3.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75244140625, -0.7282791137695312, -0.7041168212890625, -0.6799545288085938, -0.655792236328125, -0.6316299438476562, -0.6074676513671875, -0.5833053588867188, -0.55914306640625, -0.5349807739257812, -0.5108184814453125, -0.48665618896484375, -0.462493896484375, -0.43833160400390625, -0.4141693115234375, -0.39000701904296875, -0.3658447265625, -0.34168243408203125, -0.3175201416015625, -0.29335784912109375, -0.269195556640625, -0.24503326416015625, -0.2208709716796875, -0.19670867919921875, -0.17254638671875, -0.14838409423828125, -0.1242218017578125, -0.10005950927734375, -0.075897216796875, -0.05173492431640625, -0.0275726318359375, -0.00341033935546875, 0.020751953125, 0.04491424560546875, 0.0690765380859375, 0.09323883056640625, 0.117401123046875, 0.14156341552734375, 0.1657257080078125, 0.18988800048828125, 0.21405029296875, 0.23821258544921875, 0.2623748779296875, 0.28653717041015625, 0.310699462890625, 0.33486175537109375, 0.3590240478515625, 0.38318634033203125, 0.4073486328125, 0.43151092529296875, 0.4556732177734375, 0.47983551025390625, 0.503997802734375, 0.5281600952148438, 0.5523223876953125, 0.5764846801757812, 0.60064697265625, 0.6248092651367188, 0.6489715576171875, 0.6731338500976562, 0.697296142578125, 0.7214584350585938, 0.7456207275390625, 0.7697830200195312, 0.7939453125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 8.0, 9.0, 10.0, 13.0, 22.0, 19.0, 38.0, 44.0, 42.0, 64.0, 102.0, 267.0, 924.0, 4392.0, 33324.0, 3771179.0, 362940.0, 16899.0, 2761.0, 652.0, 221.0, 95.0, 62.0, 35.0, 41.0, 26.0, 21.0, 18.0, 13.0, 14.0, 10.0, 4.0, 2.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.23046875, -4.112457275390625, -3.99444580078125, -3.876434326171875, -3.7584228515625, -3.640411376953125, -3.52239990234375, -3.404388427734375, -3.286376953125, -3.168365478515625, -3.05035400390625, -2.932342529296875, -2.8143310546875, -2.696319580078125, -2.57830810546875, -2.460296630859375, -2.34228515625, -2.224273681640625, -2.10626220703125, -1.988250732421875, -1.8702392578125, -1.752227783203125, -1.63421630859375, -1.516204833984375, -1.398193359375, -1.280181884765625, -1.16217041015625, -1.044158935546875, -0.9261474609375, -0.808135986328125, -0.69012451171875, -0.572113037109375, -0.4541015625, -0.336090087890625, -0.21807861328125, -0.100067138671875, 0.0179443359375, 0.135955810546875, 0.25396728515625, 0.371978759765625, 0.489990234375, 0.608001708984375, 0.72601318359375, 0.844024658203125, 0.9620361328125, 1.080047607421875, 1.19805908203125, 1.316070556640625, 1.43408203125, 1.552093505859375, 1.67010498046875, 1.788116455078125, 1.9061279296875, 2.024139404296875, 2.14215087890625, 2.260162353515625, 2.378173828125, 2.496185302734375, 2.61419677734375, 2.732208251953125, 2.8502197265625, 2.968231201171875, 3.08624267578125, 3.204254150390625, 3.322265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 6.0, 1.0, 3.0, 5.0, 3.0, 4.0, 12.0, 17.0, 13.0, 14.0, 18.0, 27.0, 34.0, 66.0, 84.0, 131.0, 388.0, 1880.0, 758.0, 214.0, 111.0, 68.0, 55.0, 43.0, 33.0, 24.0, 14.0, 10.0, 8.0, 5.0, 5.0, 6.0, 6.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.4169921875, -0.40079498291015625, -0.3845977783203125, -0.36840057373046875, -0.352203369140625, -0.33600616455078125, -0.3198089599609375, -0.30361175537109375, -0.28741455078125, -0.27121734619140625, -0.2550201416015625, -0.23882293701171875, -0.222625732421875, -0.20642852783203125, -0.1902313232421875, -0.17403411865234375, -0.1578369140625, -0.14163970947265625, -0.1254425048828125, -0.10924530029296875, -0.093048095703125, -0.07685089111328125, -0.0606536865234375, -0.04445648193359375, -0.02825927734375, -0.01206207275390625, 0.0041351318359375, 0.02033233642578125, 0.036529541015625, 0.05272674560546875, 0.0689239501953125, 0.08512115478515625, 0.101318359375, 0.11751556396484375, 0.1337127685546875, 0.14990997314453125, 0.166107177734375, 0.18230438232421875, 0.1985015869140625, 0.21469879150390625, 0.23089599609375, 0.24709320068359375, 0.2632904052734375, 0.27948760986328125, 0.295684814453125, 0.31188201904296875, 0.3280792236328125, 0.34427642822265625, 0.3604736328125, 0.37667083740234375, 0.3928680419921875, 0.40906524658203125, 0.425262451171875, 0.44145965576171875, 0.4576568603515625, 0.47385406494140625, 0.49005126953125, 0.5062484741210938, 0.5224456787109375, 0.5386428833007812, 0.554840087890625, 0.5710372924804688, 0.5872344970703125, 0.6034317016601562, 0.61962890625]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 7.0, 7.0, 17.0, 40.0, 92.0, 187.0, 242.0, 202.0, 97.0, 62.0, 26.0, 6.0, 10.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.459556579589844, -5.267805099487305, -5.076053619384766, -4.884302139282227, -4.6925506591796875, -4.500799179077148, -4.309047698974609, -4.11729621887207, -3.9255447387695312, -3.733793258666992, -3.542041778564453, -3.350290298461914, -3.158538818359375, -2.966787338256836, -2.775035858154297, -2.583284378051758, -2.3915328979492188, -2.1997814178466797, -2.0080299377441406, -1.8162784576416016, -1.6245269775390625, -1.4327754974365234, -1.2410240173339844, -1.0492725372314453, -0.8575210571289062, -0.6657695770263672, -0.4740180969238281, -0.28226661682128906, -0.09051513671875, 0.10123634338378906, 0.2929878234863281, 0.4847393035888672, 0.676490306854248, 0.8682417869567871, 1.0599932670593262, 1.2517447471618652, 1.4434962272644043, 1.6352477073669434, 1.8269991874694824, 2.0187506675720215, 2.2105021476745605, 2.4022536277770996, 2.5940051078796387, 2.7857565879821777, 2.977508068084717, 3.169259548187256, 3.361011028289795, 3.552762508392334, 3.744513988494873, 3.936265468597412, 4.128016948699951, 4.31976842880249, 4.511519908905029, 4.703271389007568, 4.895022869110107, 5.0867743492126465, 5.2785258293151855, 5.470277309417725, 5.662028789520264, 5.853780269622803, 6.045531749725342, 6.237283229827881, 6.42903470993042, 6.620786190032959, 6.812537670135498]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 2.0, 2.0, 3.0, 6.0, 8.0, 11.0, 11.0, 17.0, 27.0, 27.0, 22.0, 34.0, 33.0, 49.0, 43.0, 38.0, 47.0, 55.0, 56.0, 57.0, 44.0, 48.0, 49.0, 41.0, 41.0, 45.0, 30.0, 32.0, 33.0, 17.0, 16.0, 12.0, 12.0, 8.0, 9.0, 4.0, 7.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9835054874420166, -1.9156304597854614, -1.8477554321289062, -1.7798802852630615, -1.7120052576065063, -1.6441302299499512, -1.5762550830841064, -1.5083800554275513, -1.440505027770996, -1.372630000114441, -1.3047549724578857, -1.236879825592041, -1.1690047979354858, -1.1011297702789307, -1.033254623413086, -0.9653795957565308, -0.8975045680999756, -0.8296295404434204, -0.7617544531822205, -0.6938793659210205, -0.6260043382644653, -0.5581293106079102, -0.4902542233467102, -0.42237916588783264, -0.3545041084289551, -0.2866290509700775, -0.21875399351119995, -0.1508789360523224, -0.08300387859344482, -0.01512882113456726, 0.0527462363243103, 0.12062129378318787, 0.18849635124206543, 0.256371408700943, 0.32424646615982056, 0.3921215236186981, 0.4599965810775757, 0.5278716087341309, 0.5957466959953308, 0.6636217832565308, 0.7314968109130859, 0.7993718385696411, 0.8672469258308411, 0.935122013092041, 1.0029970407485962, 1.0708720684051514, 1.138747215270996, 1.2066222429275513, 1.2744972705841064, 1.3423722982406616, 1.4102473258972168, 1.4781224727630615, 1.5459975004196167, 1.6138725280761719, 1.6817476749420166, 1.7496227025985718, 1.817497730255127, 1.8853727579116821, 1.9532477855682373, 2.021122932434082, 2.0889978408813477, 2.1568729877471924, 2.224748134613037, 2.2926230430603027, 2.3604981899261475]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 9.0, 13.0, 3.0, 10.0, 6.0, 17.0, 18.0, 23.0, 42.0, 58.0, 77.0, 95.0, 124.0, 195.0, 346.0, 489.0, 868.0, 1883.0, 4254.0, 13022.0, 50740.0, 234703.0, 522629.0, 165732.0, 36179.0, 9817.0, 3449.0, 1557.0, 722.0, 437.0, 324.0, 204.0, 143.0, 76.0, 74.0, 45.0, 34.0, 27.0, 26.0, 16.0, 10.0, 12.0, 7.0, 7.0, 6.0, 6.0, 4.0, 3.0, 5.0, 2.0, 0.0, 2.0], "bins": [-2.392578125, -2.322998046875, -2.25341796875, -2.183837890625, -2.1142578125, -2.044677734375, -1.97509765625, -1.905517578125, -1.8359375, -1.766357421875, -1.69677734375, -1.627197265625, -1.5576171875, -1.488037109375, -1.41845703125, -1.348876953125, -1.279296875, -1.209716796875, -1.14013671875, -1.070556640625, -1.0009765625, -0.931396484375, -0.86181640625, -0.792236328125, -0.72265625, -0.653076171875, -0.58349609375, -0.513916015625, -0.4443359375, -0.374755859375, -0.30517578125, -0.235595703125, -0.166015625, -0.096435546875, -0.02685546875, 0.042724609375, 0.1123046875, 0.181884765625, 0.25146484375, 0.321044921875, 0.390625, 0.460205078125, 0.52978515625, 0.599365234375, 0.6689453125, 0.738525390625, 0.80810546875, 0.877685546875, 0.947265625, 1.016845703125, 1.08642578125, 1.156005859375, 1.2255859375, 1.295166015625, 1.36474609375, 1.434326171875, 1.50390625, 1.573486328125, 1.64306640625, 1.712646484375, 1.7822265625, 1.851806640625, 1.92138671875, 1.990966796875, 2.060546875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 6.0, 13.0, 20.0, 40.0, 67.0, 53.0, 77.0, 106.0, 102.0, 97.0, 107.0, 81.0, 64.0, 69.0, 31.0, 28.0, 20.0, 5.0, 8.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69873046875, -0.6755599975585938, -0.6523895263671875, -0.6292190551757812, -0.606048583984375, -0.5828781127929688, -0.5597076416015625, -0.5365371704101562, -0.51336669921875, -0.49019622802734375, -0.4670257568359375, -0.44385528564453125, -0.420684814453125, -0.39751434326171875, -0.3743438720703125, -0.35117340087890625, -0.3280029296875, -0.30483245849609375, -0.2816619873046875, -0.25849151611328125, -0.235321044921875, -0.21215057373046875, -0.1889801025390625, -0.16580963134765625, -0.14263916015625, -0.11946868896484375, -0.0962982177734375, -0.07312774658203125, -0.049957275390625, -0.02678680419921875, -0.0036163330078125, 0.01955413818359375, 0.042724609375, 0.06589508056640625, 0.0890655517578125, 0.11223602294921875, 0.135406494140625, 0.15857696533203125, 0.1817474365234375, 0.20491790771484375, 0.22808837890625, 0.25125885009765625, 0.2744293212890625, 0.29759979248046875, 0.320770263671875, 0.34394073486328125, 0.3671112060546875, 0.39028167724609375, 0.4134521484375, 0.43662261962890625, 0.4597930908203125, 0.48296356201171875, 0.506134033203125, 0.5293045043945312, 0.5524749755859375, 0.5756454467773438, 0.59881591796875, 0.6219863891601562, 0.6451568603515625, 0.6683273315429688, 0.691497802734375, 0.7146682739257812, 0.7378387451171875, 0.7610092163085938, 0.7841796875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 6.0, 9.0, 20.0, 32.0, 50.0, 81.0, 149.0, 312.0, 571.0, 1270.0, 3115.0, 9343.0, 34425.0, 155192.0, 522550.0, 246722.0, 53522.0, 13803.0, 4308.0, 1623.0, 682.0, 356.0, 196.0, 80.0, 52.0, 25.0, 20.0, 10.0, 9.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8408203125, -1.7861175537109375, -1.731414794921875, -1.6767120361328125, -1.62200927734375, -1.5673065185546875, -1.512603759765625, -1.4579010009765625, -1.4031982421875, -1.3484954833984375, -1.293792724609375, -1.2390899658203125, -1.18438720703125, -1.1296844482421875, -1.074981689453125, -1.0202789306640625, -0.965576171875, -0.9108734130859375, -0.856170654296875, -0.8014678955078125, -0.74676513671875, -0.6920623779296875, -0.637359619140625, -0.5826568603515625, -0.5279541015625, -0.4732513427734375, -0.418548583984375, -0.3638458251953125, -0.30914306640625, -0.2544403076171875, -0.199737548828125, -0.1450347900390625, -0.09033203125, -0.0356292724609375, 0.019073486328125, 0.0737762451171875, 0.12847900390625, 0.1831817626953125, 0.237884521484375, 0.2925872802734375, 0.3472900390625, 0.4019927978515625, 0.456695556640625, 0.5113983154296875, 0.56610107421875, 0.6208038330078125, 0.675506591796875, 0.7302093505859375, 0.784912109375, 0.8396148681640625, 0.894317626953125, 0.9490203857421875, 1.00372314453125, 1.0584259033203125, 1.113128662109375, 1.1678314208984375, 1.2225341796875, 1.2772369384765625, 1.331939697265625, 1.3866424560546875, 1.44134521484375, 1.4960479736328125, 1.550750732421875, 1.6054534912109375, 1.66015625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 6.0, 6.0, 19.0, 7.0, 13.0, 26.0, 25.0, 20.0, 36.0, 34.0, 43.0, 45.0, 52.0, 54.0, 47.0, 49.0, 59.0, 50.0, 44.0, 49.0, 51.0, 34.0, 42.0, 47.0, 24.0, 20.0, 18.0, 16.0, 12.0, 13.0, 10.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.5439453125, -1.4937286376953125, -1.443511962890625, -1.3932952880859375, -1.34307861328125, -1.2928619384765625, -1.242645263671875, -1.1924285888671875, -1.1422119140625, -1.0919952392578125, -1.041778564453125, -0.9915618896484375, -0.94134521484375, -0.8911285400390625, -0.840911865234375, -0.7906951904296875, -0.740478515625, -0.6902618408203125, -0.640045166015625, -0.5898284912109375, -0.53961181640625, -0.4893951416015625, -0.439178466796875, -0.3889617919921875, -0.3387451171875, -0.2885284423828125, -0.238311767578125, -0.1880950927734375, -0.13787841796875, -0.0876617431640625, -0.037445068359375, 0.0127716064453125, 0.06298828125, 0.1132049560546875, 0.163421630859375, 0.2136383056640625, 0.26385498046875, 0.3140716552734375, 0.364288330078125, 0.4145050048828125, 0.4647216796875, 0.5149383544921875, 0.565155029296875, 0.6153717041015625, 0.66558837890625, 0.7158050537109375, 0.766021728515625, 0.8162384033203125, 0.866455078125, 0.9166717529296875, 0.966888427734375, 1.0171051025390625, 1.06732177734375, 1.1175384521484375, 1.167755126953125, 1.2179718017578125, 1.2681884765625, 1.3184051513671875, 1.368621826171875, 1.4188385009765625, 1.46905517578125, 1.5192718505859375, 1.569488525390625, 1.6197052001953125, 1.669921875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 5.0, 6.0, 14.0, 28.0, 39.0, 67.0, 121.0, 302.0, 650.0, 1633.0, 5917.0, 32657.0, 301238.0, 604080.0, 85370.0, 11844.0, 2811.0, 904.0, 413.0, 218.0, 105.0, 50.0, 37.0, 9.0, 10.0, 6.0, 3.0, 3.0, 4.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.138671875, -1.1096420288085938, -1.0806121826171875, -1.0515823364257812, -1.022552490234375, -0.9935226440429688, -0.9644927978515625, -0.9354629516601562, -0.90643310546875, -0.8774032592773438, -0.8483734130859375, -0.8193435668945312, -0.790313720703125, -0.7612838745117188, -0.7322540283203125, -0.7032241821289062, -0.6741943359375, -0.6451644897460938, -0.6161346435546875, -0.5871047973632812, -0.558074951171875, -0.5290451049804688, -0.5000152587890625, -0.47098541259765625, -0.44195556640625, -0.41292572021484375, -0.3838958740234375, -0.35486602783203125, -0.325836181640625, -0.29680633544921875, -0.2677764892578125, -0.23874664306640625, -0.209716796875, -0.18068695068359375, -0.1516571044921875, -0.12262725830078125, -0.093597412109375, -0.06456756591796875, -0.0355377197265625, -0.00650787353515625, 0.02252197265625, 0.05155181884765625, 0.0805816650390625, 0.10961151123046875, 0.138641357421875, 0.16767120361328125, 0.1967010498046875, 0.22573089599609375, 0.2547607421875, 0.28379058837890625, 0.3128204345703125, 0.34185028076171875, 0.370880126953125, 0.39990997314453125, 0.4289398193359375, 0.45796966552734375, 0.48699951171875, 0.5160293579101562, 0.5450592041015625, 0.5740890502929688, 0.603118896484375, 0.6321487426757812, 0.6611785888671875, 0.6902084350585938, 0.71923828125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 5.0, 6.0, 6.0, 15.0, 26.0, 37.0, 50.0, 91.0, 124.0, 203.0, 136.0, 95.0, 67.0, 40.0, 36.0, 20.0, 13.0, 13.0, 10.0, 5.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022983551025390625, -0.00022126734256744385, -0.00021269917488098145, -0.00020413100719451904, -0.00019556283950805664, -0.00018699467182159424, -0.00017842650413513184, -0.00016985833644866943, -0.00016129016876220703, -0.00015272200107574463, -0.00014415383338928223, -0.00013558566570281982, -0.00012701749801635742, -0.00011844933032989502, -0.00010988116264343262, -0.00010131299495697021, -9.274482727050781e-05, -8.417665958404541e-05, -7.560849189758301e-05, -6.70403242111206e-05, -5.84721565246582e-05, -4.99039888381958e-05, -4.13358211517334e-05, -3.2767653465270996e-05, -2.4199485778808594e-05, -1.563131809234619e-05, -7.063150405883789e-06, 1.5050172805786133e-06, 1.0073184967041016e-05, 1.8641352653503418e-05, 2.720952033996582e-05, 3.577768802642822e-05, 4.4345855712890625e-05, 5.291402339935303e-05, 6.148219108581543e-05, 7.005035877227783e-05, 7.861852645874023e-05, 8.718669414520264e-05, 9.575486183166504e-05, 0.00010432302951812744, 0.00011289119720458984, 0.00012145936489105225, 0.00013002753257751465, 0.00013859570026397705, 0.00014716386795043945, 0.00015573203563690186, 0.00016430020332336426, 0.00017286837100982666, 0.00018143653869628906, 0.00019000470638275146, 0.00019857287406921387, 0.00020714104175567627, 0.00021570920944213867, 0.00022427737712860107, 0.00023284554481506348, 0.00024141371250152588, 0.0002499818801879883, 0.0002585500478744507, 0.0002671182155609131, 0.0002756863832473755, 0.0002842545509338379, 0.0002928227186203003, 0.0003013908863067627, 0.0003099590539932251, 0.0003185272216796875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 2.0, 6.0, 5.0, 7.0, 12.0, 16.0, 25.0, 54.0, 83.0, 183.0, 301.0, 687.0, 1843.0, 6109.0, 27171.0, 179787.0, 614190.0, 180869.0, 27763.0, 6199.0, 1858.0, 679.0, 335.0, 158.0, 92.0, 40.0, 36.0, 11.0, 7.0, 7.0, 12.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74609375, -0.7199172973632812, -0.6937408447265625, -0.6675643920898438, -0.641387939453125, -0.6152114868164062, -0.5890350341796875, -0.5628585815429688, -0.53668212890625, -0.5105056762695312, -0.4843292236328125, -0.45815277099609375, -0.431976318359375, -0.40579986572265625, -0.3796234130859375, -0.35344696044921875, -0.3272705078125, -0.30109405517578125, -0.2749176025390625, -0.24874114990234375, -0.222564697265625, -0.19638824462890625, -0.1702117919921875, -0.14403533935546875, -0.11785888671875, -0.09168243408203125, -0.0655059814453125, -0.03932952880859375, -0.013153076171875, 0.01302337646484375, 0.0391998291015625, 0.06537628173828125, 0.091552734375, 0.11772918701171875, 0.1439056396484375, 0.17008209228515625, 0.196258544921875, 0.22243499755859375, 0.2486114501953125, 0.27478790283203125, 0.30096435546875, 0.32714080810546875, 0.3533172607421875, 0.37949371337890625, 0.405670166015625, 0.43184661865234375, 0.4580230712890625, 0.48419952392578125, 0.5103759765625, 0.5365524291992188, 0.5627288818359375, 0.5889053344726562, 0.615081787109375, 0.6412582397460938, 0.6674346923828125, 0.6936111450195312, 0.71978759765625, 0.7459640502929688, 0.7721405029296875, 0.7983169555664062, 0.824493408203125, 0.8506698608398438, 0.8768463134765625, 0.9030227661132812, 0.92919921875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 4.0, 2.0, 9.0, 4.0, 9.0, 12.0, 14.0, 12.0, 33.0, 32.0, 45.0, 60.0, 65.0, 78.0, 88.0, 81.0, 81.0, 70.0, 69.0, 53.0, 45.0, 33.0, 24.0, 13.0, 16.0, 11.0, 13.0, 10.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4072265625, -0.38994598388671875, -0.3726654052734375, -0.35538482666015625, -0.338104248046875, -0.32082366943359375, -0.3035430908203125, -0.28626251220703125, -0.26898193359375, -0.25170135498046875, -0.2344207763671875, -0.21714019775390625, -0.199859619140625, -0.18257904052734375, -0.1652984619140625, -0.14801788330078125, -0.1307373046875, -0.11345672607421875, -0.0961761474609375, -0.07889556884765625, -0.061614990234375, -0.04433441162109375, -0.0270538330078125, -0.00977325439453125, 0.00750732421875, 0.02478790283203125, 0.0420684814453125, 0.05934906005859375, 0.076629638671875, 0.09391021728515625, 0.1111907958984375, 0.12847137451171875, 0.145751953125, 0.16303253173828125, 0.1803131103515625, 0.19759368896484375, 0.214874267578125, 0.23215484619140625, 0.2494354248046875, 0.26671600341796875, 0.28399658203125, 0.30127716064453125, 0.3185577392578125, 0.33583831787109375, 0.353118896484375, 0.37039947509765625, 0.3876800537109375, 0.40496063232421875, 0.4222412109375, 0.43952178955078125, 0.4568023681640625, 0.47408294677734375, 0.491363525390625, 0.5086441040039062, 0.5259246826171875, 0.5432052612304688, 0.56048583984375, 0.5777664184570312, 0.5950469970703125, 0.6123275756835938, 0.629608154296875, 0.6468887329101562, 0.6641693115234375, 0.6814498901367188, 0.69873046875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 13.0, 59.0, 137.0, 230.0, 264.0, 164.0, 75.0, 29.0, 18.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.69253921508789, -23.037601470947266, -22.38266372680664, -21.727725982666016, -21.07278823852539, -20.417850494384766, -19.76291275024414, -19.107975006103516, -18.45303726196289, -17.798099517822266, -17.14316177368164, -16.488224029541016, -15.83328628540039, -15.178348541259766, -14.52341079711914, -13.868473052978516, -13.21353530883789, -12.558597564697266, -11.90365982055664, -11.248722076416016, -10.59378433227539, -9.938846588134766, -9.28390884399414, -8.628971099853516, -7.974033355712891, -7.319095611572266, -6.664157867431641, -6.009220123291016, -5.354282379150391, -4.699344635009766, -4.044406890869141, -3.3894691467285156, -2.734529495239258, -2.079591751098633, -1.4246540069580078, -0.7697162628173828, -0.11477851867675781, 0.5401592254638672, 1.1950969696044922, 1.8500347137451172, 2.504972457885742, 3.159910202026367, 3.814847946166992, 4.469785690307617, 5.124723434448242, 5.779661178588867, 6.434598922729492, 7.089536666870117, 7.744474411010742, 8.399412155151367, 9.054349899291992, 9.709287643432617, 10.364225387573242, 11.019163131713867, 11.674100875854492, 12.329038619995117, 12.983976364135742, 13.638914108276367, 14.293851852416992, 14.948789596557617, 15.603727340698242, 16.258665084838867, 16.913602828979492, 17.568540573120117, 18.223478317260742]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 6.0, 1.0, 2.0, 9.0, 7.0, 14.0, 15.0, 15.0, 8.0, 20.0, 28.0, 19.0, 26.0, 35.0, 29.0, 32.0, 36.0, 36.0, 49.0, 46.0, 51.0, 43.0, 38.0, 49.0, 42.0, 30.0, 37.0, 30.0, 26.0, 31.0, 37.0, 36.0, 24.0, 20.0, 15.0, 16.0, 13.0, 10.0, 5.0, 3.0, 8.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.390182495117188, -8.146397590637207, -7.902613162994385, -7.658828258514404, -7.415043354034424, -7.171258926391602, -6.927474021911621, -6.683689117431641, -6.43990421295166, -6.19611930847168, -5.952334880828857, -5.708549976348877, -5.4647650718688965, -5.220980644226074, -4.977195739746094, -4.733410835266113, -4.489626407623291, -4.2458415031433105, -4.002057075500488, -3.758272171020508, -3.5144872665405273, -3.270702600479126, -3.0269179344177246, -2.783133029937744, -2.5393483638763428, -2.2955636978149414, -2.051778793334961, -1.8079941272735596, -1.5642093420028687, -1.3204245567321777, -1.0766398906707764, -0.8328551054000854, -0.5890703201293945, -0.345285564661026, -0.10150080919265747, 0.14228391647338867, 0.3860687017440796, 0.6298534870147705, 0.8736381530761719, 1.1174229383468628, 1.3612077236175537, 1.6049925088882446, 1.8487772941589355, 2.092561960220337, 2.3363466262817383, 2.5801315307617188, 2.82391619682312, 3.0677008628845215, 3.311485767364502, 3.5552704334259033, 3.799055337905884, 4.042840003967285, 4.286624908447266, 4.530409812927246, 4.774194240570068, 5.017979145050049, 5.261763572692871, 5.505548477172852, 5.749332904815674, 5.993117809295654, 6.236902713775635, 6.480687141418457, 6.7244720458984375, 6.968256950378418, 7.212041854858398]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 4.0, 3.0, 7.0, 12.0, 9.0, 15.0, 29.0, 46.0, 57.0, 123.0, 175.0, 329.0, 666.0, 1569.0, 5084.0, 28373.0, 3658686.0, 472697.0, 19946.0, 3981.0, 1305.0, 560.0, 270.0, 128.0, 76.0, 45.0, 33.0, 19.0, 12.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.958984375, -3.826629638671875, -3.69427490234375, -3.561920166015625, -3.4295654296875, -3.297210693359375, -3.16485595703125, -3.032501220703125, -2.900146484375, -2.767791748046875, -2.63543701171875, -2.503082275390625, -2.3707275390625, -2.238372802734375, -2.10601806640625, -1.973663330078125, -1.84130859375, -1.708953857421875, -1.57659912109375, -1.444244384765625, -1.3118896484375, -1.179534912109375, -1.04718017578125, -0.914825439453125, -0.782470703125, -0.650115966796875, -0.51776123046875, -0.385406494140625, -0.2530517578125, -0.120697021484375, 0.01165771484375, 0.144012451171875, 0.2763671875, 0.408721923828125, 0.54107666015625, 0.673431396484375, 0.8057861328125, 0.938140869140625, 1.07049560546875, 1.202850341796875, 1.335205078125, 1.467559814453125, 1.59991455078125, 1.732269287109375, 1.8646240234375, 1.996978759765625, 2.12933349609375, 2.261688232421875, 2.39404296875, 2.526397705078125, 2.65875244140625, 2.791107177734375, 2.9234619140625, 3.055816650390625, 3.18817138671875, 3.320526123046875, 3.452880859375, 3.585235595703125, 3.71759033203125, 3.849945068359375, 3.9822998046875, 4.114654541015625, 4.24700927734375, 4.379364013671875, 4.51171875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 3.0, 10.0, 22.0, 31.0, 31.0, 53.0, 73.0, 75.0, 83.0, 79.0, 88.0, 86.0, 74.0, 73.0, 71.0, 45.0, 40.0, 23.0, 7.0, 13.0, 10.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6708984375, -0.6480789184570312, -0.6252593994140625, -0.6024398803710938, -0.579620361328125, -0.5568008422851562, -0.5339813232421875, -0.5111618041992188, -0.48834228515625, -0.46552276611328125, -0.4427032470703125, -0.41988372802734375, -0.397064208984375, -0.37424468994140625, -0.3514251708984375, -0.32860565185546875, -0.3057861328125, -0.28296661376953125, -0.2601470947265625, -0.23732757568359375, -0.214508056640625, -0.19168853759765625, -0.1688690185546875, -0.14604949951171875, -0.12322998046875, -0.10041046142578125, -0.0775909423828125, -0.05477142333984375, -0.031951904296875, -0.00913238525390625, 0.0136871337890625, 0.03650665283203125, 0.059326171875, 0.08214569091796875, 0.1049652099609375, 0.12778472900390625, 0.150604248046875, 0.17342376708984375, 0.1962432861328125, 0.21906280517578125, 0.24188232421875, 0.26470184326171875, 0.2875213623046875, 0.31034088134765625, 0.333160400390625, 0.35597991943359375, 0.3787994384765625, 0.40161895751953125, 0.4244384765625, 0.44725799560546875, 0.4700775146484375, 0.49289703369140625, 0.515716552734375, 0.5385360717773438, 0.5613555908203125, 0.5841751098632812, 0.60699462890625, 0.6298141479492188, 0.6526336669921875, 0.6754531860351562, 0.698272705078125, 0.7210922241210938, 0.7439117431640625, 0.7667312622070312, 0.78955078125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 10.0, 6.0, 12.0, 23.0, 30.0, 44.0, 50.0, 81.0, 153.0, 314.0, 734.0, 2467.0, 11269.0, 90503.0, 3885196.0, 180463.0, 17384.0, 3528.0, 1038.0, 427.0, 199.0, 120.0, 76.0, 48.0, 39.0, 18.0, 17.0, 12.0, 7.0, 9.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.642578125, -2.5394287109375, -2.436279296875, -2.3331298828125, -2.22998046875, -2.1268310546875, -2.023681640625, -1.9205322265625, -1.8173828125, -1.7142333984375, -1.611083984375, -1.5079345703125, -1.40478515625, -1.3016357421875, -1.198486328125, -1.0953369140625, -0.9921875, -0.8890380859375, -0.785888671875, -0.6827392578125, -0.57958984375, -0.4764404296875, -0.373291015625, -0.2701416015625, -0.1669921875, -0.0638427734375, 0.039306640625, 0.1424560546875, 0.24560546875, 0.3487548828125, 0.451904296875, 0.5550537109375, 0.658203125, 0.7613525390625, 0.864501953125, 0.9676513671875, 1.07080078125, 1.1739501953125, 1.277099609375, 1.3802490234375, 1.4833984375, 1.5865478515625, 1.689697265625, 1.7928466796875, 1.89599609375, 1.9991455078125, 2.102294921875, 2.2054443359375, 2.30859375, 2.4117431640625, 2.514892578125, 2.6180419921875, 2.72119140625, 2.8243408203125, 2.927490234375, 3.0306396484375, 3.1337890625, 3.2369384765625, 3.340087890625, 3.4432373046875, 3.54638671875, 3.6495361328125, 3.752685546875, 3.8558349609375, 3.958984375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 5.0, 8.0, 7.0, 19.0, 18.0, 25.0, 43.0, 78.0, 107.0, 315.0, 1668.0, 1220.0, 261.0, 111.0, 70.0, 47.0, 19.0, 17.0, 17.0, 4.0, 5.0, 4.0, 4.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69140625, -0.6584014892578125, -0.625396728515625, -0.5923919677734375, -0.55938720703125, -0.5263824462890625, -0.493377685546875, -0.4603729248046875, -0.4273681640625, -0.3943634033203125, -0.361358642578125, -0.3283538818359375, -0.29534912109375, -0.2623443603515625, -0.229339599609375, -0.1963348388671875, -0.163330078125, -0.1303253173828125, -0.097320556640625, -0.0643157958984375, -0.03131103515625, 0.0016937255859375, 0.034698486328125, 0.0677032470703125, 0.1007080078125, 0.1337127685546875, 0.166717529296875, 0.1997222900390625, 0.23272705078125, 0.2657318115234375, 0.298736572265625, 0.3317413330078125, 0.36474609375, 0.3977508544921875, 0.430755615234375, 0.4637603759765625, 0.49676513671875, 0.5297698974609375, 0.562774658203125, 0.5957794189453125, 0.6287841796875, 0.6617889404296875, 0.694793701171875, 0.7277984619140625, 0.76080322265625, 0.7938079833984375, 0.826812744140625, 0.8598175048828125, 0.892822265625, 0.9258270263671875, 0.958831787109375, 0.9918365478515625, 1.02484130859375, 1.0578460693359375, 1.090850830078125, 1.1238555908203125, 1.1568603515625, 1.1898651123046875, 1.222869873046875, 1.2558746337890625, 1.28887939453125, 1.3218841552734375, 1.354888916015625, 1.3878936767578125, 1.4208984375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 7.0, 7.0, 32.0, 53.0, 152.0, 256.0, 267.0, 136.0, 46.0, 25.0, 12.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.701001167297363, -11.407792091369629, -11.114583969116211, -10.821374893188477, -10.528166770935059, -10.234957695007324, -9.941749572753906, -9.648540496826172, -9.355332374572754, -9.06212329864502, -8.768915176391602, -8.475706100463867, -8.18249797821045, -7.889289379119873, -7.596080780029297, -7.3028717041015625, -7.009663105010986, -6.71645450592041, -6.423245906829834, -6.130037307739258, -5.836828708648682, -5.5436201095581055, -5.250411033630371, -4.957202911376953, -4.663993835449219, -4.370785236358643, -4.077576637268066, -3.7843680381774902, -3.491159439086914, -3.197950839996338, -2.9047420024871826, -2.6115334033966064, -2.3183250427246094, -2.025116443634033, -1.731907844543457, -1.4386991262435913, -1.1454905271530151, -0.852281928062439, -0.5590732097625732, -0.26586461067199707, 0.0273439884185791, 0.32055261731147766, 0.6137612462043762, 0.9069699048995972, 1.2001785039901733, 1.4933871030807495, 1.7865958213806152, 2.0798044204711914, 2.3730130195617676, 2.6662216186523438, 2.95943021774292, 3.252638816833496, 3.5458474159240723, 3.8390560150146484, 4.132265090942383, 4.425473213195801, 4.718682289123535, 5.011890888214111, 5.3050994873046875, 5.598308086395264, 5.89151668548584, 6.184725284576416, 6.477933883666992, 6.771142959594727, 7.0643510818481445]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 6.0, 4.0, 6.0, 4.0, 11.0, 9.0, 14.0, 18.0, 26.0, 23.0, 31.0, 30.0, 25.0, 33.0, 35.0, 46.0, 35.0, 53.0, 63.0, 49.0, 53.0, 56.0, 48.0, 49.0, 51.0, 42.0, 29.0, 24.0, 24.0, 19.0, 19.0, 17.0, 14.0, 14.0, 9.0, 3.0, 6.0, 3.0, 7.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.847490668296814, -1.761703372001648, -1.6759161949157715, -1.5901288986206055, -1.5043416023254395, -1.4185543060302734, -1.3327670097351074, -1.246979832649231, -1.161192536354065, -1.075405240058899, -0.9896180033683777, -0.9038307666778564, -0.8180434703826904, -0.7322561740875244, -0.6464689373970032, -0.5606817007064819, -0.4748944044113159, -0.3891071379184723, -0.30331987142562866, -0.21753260493278503, -0.1317453384399414, -0.04595807194709778, 0.03982919454574585, 0.1256164312362671, 0.2114037275314331, 0.29719099402427673, 0.38297826051712036, 0.468765527009964, 0.5545527935028076, 0.6403400897979736, 0.7261273264884949, 0.8119145631790161, 0.8977019786834717, 0.9834892749786377, 1.0692765712738037, 1.1550637483596802, 1.2408510446548462, 1.3266383409500122, 1.4124255180358887, 1.4982128143310547, 1.5840001106262207, 1.6697874069213867, 1.7555747032165527, 1.8413618803024292, 1.9271491765975952, 2.0129363536834717, 2.0987236499786377, 2.1845109462738037, 2.2702982425689697, 2.3560855388641357, 2.4418728351593018, 2.5276601314544678, 2.6134471893310547, 2.6992344856262207, 2.7850217819213867, 2.8708090782165527, 2.9565963745117188, 3.0423836708068848, 3.128170967102051, 3.213958263397217, 3.299745559692383, 3.3855326175689697, 3.4713199138641357, 3.5571072101593018, 3.6428945064544678]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 8.0, 14.0, 21.0, 48.0, 113.0, 203.0, 546.0, 1661.0, 8540.0, 135251.0, 844902.0, 50455.0, 4939.0, 1113.0, 401.0, 171.0, 81.0, 39.0, 20.0, 10.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.56640625, -5.40435791015625, -5.2423095703125, -5.08026123046875, -4.918212890625, -4.75616455078125, -4.5941162109375, -4.43206787109375, -4.27001953125, -4.10797119140625, -3.9459228515625, -3.78387451171875, -3.621826171875, -3.45977783203125, -3.2977294921875, -3.13568115234375, -2.9736328125, -2.81158447265625, -2.6495361328125, -2.48748779296875, -2.325439453125, -2.16339111328125, -2.0013427734375, -1.83929443359375, -1.67724609375, -1.51519775390625, -1.3531494140625, -1.19110107421875, -1.029052734375, -0.86700439453125, -0.7049560546875, -0.54290771484375, -0.380859375, -0.21881103515625, -0.0567626953125, 0.10528564453125, 0.267333984375, 0.42938232421875, 0.5914306640625, 0.75347900390625, 0.91552734375, 1.07757568359375, 1.2396240234375, 1.40167236328125, 1.563720703125, 1.72576904296875, 1.8878173828125, 2.04986572265625, 2.2119140625, 2.37396240234375, 2.5360107421875, 2.69805908203125, 2.860107421875, 3.02215576171875, 3.1842041015625, 3.34625244140625, 3.50830078125, 3.67034912109375, 3.8323974609375, 3.99444580078125, 4.156494140625, 4.31854248046875, 4.4805908203125, 4.64263916015625, 4.8046875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 3.0, 7.0, 12.0, 22.0, 28.0, 46.0, 52.0, 64.0, 73.0, 80.0, 81.0, 89.0, 96.0, 78.0, 69.0, 47.0, 49.0, 33.0, 20.0, 22.0, 11.0, 6.0, 7.0, 5.0, 1.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7080078125, -0.684661865234375, -0.66131591796875, -0.637969970703125, -0.6146240234375, -0.591278076171875, -0.56793212890625, -0.544586181640625, -0.521240234375, -0.497894287109375, -0.47454833984375, -0.451202392578125, -0.4278564453125, -0.404510498046875, -0.38116455078125, -0.357818603515625, -0.33447265625, -0.311126708984375, -0.28778076171875, -0.264434814453125, -0.2410888671875, -0.217742919921875, -0.19439697265625, -0.171051025390625, -0.147705078125, -0.124359130859375, -0.10101318359375, -0.077667236328125, -0.0543212890625, -0.030975341796875, -0.00762939453125, 0.015716552734375, 0.0390625, 0.062408447265625, 0.08575439453125, 0.109100341796875, 0.1324462890625, 0.155792236328125, 0.17913818359375, 0.202484130859375, 0.225830078125, 0.249176025390625, 0.27252197265625, 0.295867919921875, 0.3192138671875, 0.342559814453125, 0.36590576171875, 0.389251708984375, 0.41259765625, 0.435943603515625, 0.45928955078125, 0.482635498046875, 0.5059814453125, 0.529327392578125, 0.55267333984375, 0.576019287109375, 0.599365234375, 0.622711181640625, 0.64605712890625, 0.669403076171875, 0.6927490234375, 0.716094970703125, 0.73944091796875, 0.762786865234375, 0.7861328125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 5.0, 12.0, 18.0, 17.0, 30.0, 33.0, 64.0, 77.0, 133.0, 249.0, 479.0, 1019.0, 2490.0, 7051.0, 26291.0, 135516.0, 597034.0, 222732.0, 39377.0, 10017.0, 3149.0, 1307.0, 637.0, 334.0, 167.0, 77.0, 76.0, 51.0, 32.0, 20.0, 19.0, 12.0, 6.0, 2.0, 8.0, 2.0, 0.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.51171875, -1.44775390625, -1.3837890625, -1.31982421875, -1.255859375, -1.19189453125, -1.1279296875, -1.06396484375, -1.0, -0.93603515625, -0.8720703125, -0.80810546875, -0.744140625, -0.68017578125, -0.6162109375, -0.55224609375, -0.48828125, -0.42431640625, -0.3603515625, -0.29638671875, -0.232421875, -0.16845703125, -0.1044921875, -0.04052734375, 0.0234375, 0.08740234375, 0.1513671875, 0.21533203125, 0.279296875, 0.34326171875, 0.4072265625, 0.47119140625, 0.53515625, 0.59912109375, 0.6630859375, 0.72705078125, 0.791015625, 0.85498046875, 0.9189453125, 0.98291015625, 1.046875, 1.11083984375, 1.1748046875, 1.23876953125, 1.302734375, 1.36669921875, 1.4306640625, 1.49462890625, 1.55859375, 1.62255859375, 1.6865234375, 1.75048828125, 1.814453125, 1.87841796875, 1.9423828125, 2.00634765625, 2.0703125, 2.13427734375, 2.1982421875, 2.26220703125, 2.326171875, 2.39013671875, 2.4541015625, 2.51806640625, 2.58203125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 4.0, 5.0, 5.0, 11.0, 7.0, 7.0, 8.0, 17.0, 11.0, 21.0, 22.0, 23.0, 38.0, 55.0, 41.0, 54.0, 29.0, 52.0, 62.0, 59.0, 43.0, 55.0, 50.0, 44.0, 45.0, 39.0, 39.0, 16.0, 28.0, 25.0, 19.0, 11.0, 10.0, 10.0, 10.0, 8.0, 5.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.7294921875, -1.6722259521484375, -1.614959716796875, -1.5576934814453125, -1.50042724609375, -1.4431610107421875, -1.385894775390625, -1.3286285400390625, -1.2713623046875, -1.2140960693359375, -1.156829833984375, -1.0995635986328125, -1.04229736328125, -0.9850311279296875, -0.927764892578125, -0.8704986572265625, -0.813232421875, -0.7559661865234375, -0.698699951171875, -0.6414337158203125, -0.58416748046875, -0.5269012451171875, -0.469635009765625, -0.4123687744140625, -0.3551025390625, -0.2978363037109375, -0.240570068359375, -0.1833038330078125, -0.12603759765625, -0.0687713623046875, -0.011505126953125, 0.0457611083984375, 0.10302734375, 0.1602935791015625, 0.217559814453125, 0.2748260498046875, 0.33209228515625, 0.3893585205078125, 0.446624755859375, 0.5038909912109375, 0.5611572265625, 0.6184234619140625, 0.675689697265625, 0.7329559326171875, 0.79022216796875, 0.8474884033203125, 0.904754638671875, 0.9620208740234375, 1.019287109375, 1.0765533447265625, 1.133819580078125, 1.1910858154296875, 1.24835205078125, 1.3056182861328125, 1.362884521484375, 1.4201507568359375, 1.4774169921875, 1.5346832275390625, 1.591949462890625, 1.6492156982421875, 1.70648193359375, 1.7637481689453125, 1.821014404296875, 1.8782806396484375, 1.935546875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 10.0, 12.0, 16.0, 40.0, 60.0, 107.0, 227.0, 547.0, 1509.0, 5152.0, 25180.0, 732021.0, 263968.0, 14270.0, 3480.0, 1098.0, 450.0, 206.0, 83.0, 43.0, 36.0, 11.0, 6.0, 7.0, 5.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.69921875, -1.64031982421875, -1.5814208984375, -1.52252197265625, -1.463623046875, -1.40472412109375, -1.3458251953125, -1.28692626953125, -1.22802734375, -1.16912841796875, -1.1102294921875, -1.05133056640625, -0.992431640625, -0.93353271484375, -0.8746337890625, -0.81573486328125, -0.7568359375, -0.69793701171875, -0.6390380859375, -0.58013916015625, -0.521240234375, -0.46234130859375, -0.4034423828125, -0.34454345703125, -0.28564453125, -0.22674560546875, -0.1678466796875, -0.10894775390625, -0.050048828125, 0.00885009765625, 0.0677490234375, 0.12664794921875, 0.185546875, 0.24444580078125, 0.3033447265625, 0.36224365234375, 0.421142578125, 0.48004150390625, 0.5389404296875, 0.59783935546875, 0.65673828125, 0.71563720703125, 0.7745361328125, 0.83343505859375, 0.892333984375, 0.95123291015625, 1.0101318359375, 1.06903076171875, 1.1279296875, 1.18682861328125, 1.2457275390625, 1.30462646484375, 1.363525390625, 1.42242431640625, 1.4813232421875, 1.54022216796875, 1.59912109375, 1.65802001953125, 1.7169189453125, 1.77581787109375, 1.834716796875, 1.89361572265625, 1.9525146484375, 2.01141357421875, 2.0703125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 5.0, 5.0, 3.0, 11.0, 15.0, 25.0, 41.0, 93.0, 150.0, 176.0, 192.0, 134.0, 69.0, 31.0, 21.0, 9.0, 8.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002613067626953125, -0.0002528056502342224, -0.0002443045377731323, -0.00023580342531204224, -0.00022730231285095215, -0.00021880120038986206, -0.00021030008792877197, -0.00020179897546768188, -0.0001932978630065918, -0.0001847967505455017, -0.00017629563808441162, -0.00016779452562332153, -0.00015929341316223145, -0.00015079230070114136, -0.00014229118824005127, -0.00013379007577896118, -0.0001252889633178711, -0.000116787850856781, -0.00010828673839569092, -9.978562593460083e-05, -9.128451347351074e-05, -8.278340101242065e-05, -7.428228855133057e-05, -6.578117609024048e-05, -5.728006362915039e-05, -4.87789511680603e-05, -4.0277838706970215e-05, -3.177672624588013e-05, -2.327561378479004e-05, -1.4774501323699951e-05, -6.273388862609863e-06, 2.2277235984802246e-06, 1.0728836059570312e-05, 1.92299485206604e-05, 2.7731060981750488e-05, 3.6232173442840576e-05, 4.4733285903930664e-05, 5.323439836502075e-05, 6.173551082611084e-05, 7.023662328720093e-05, 7.873773574829102e-05, 8.72388482093811e-05, 9.573996067047119e-05, 0.00010424107313156128, 0.00011274218559265137, 0.00012124329805374146, 0.00012974441051483154, 0.00013824552297592163, 0.00014674663543701172, 0.0001552477478981018, 0.0001637488603591919, 0.00017224997282028198, 0.00018075108528137207, 0.00018925219774246216, 0.00019775331020355225, 0.00020625442266464233, 0.00021475553512573242, 0.0002232566475868225, 0.0002317577600479126, 0.00024025887250900269, 0.0002487599849700928, 0.00025726109743118286, 0.00026576220989227295, 0.00027426332235336304, 0.0002827644348144531]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 6.0, 4.0, 6.0, 7.0, 18.0, 30.0, 40.0, 63.0, 63.0, 106.0, 147.0, 253.0, 531.0, 1941.0, 12450.0, 529216.0, 488293.0, 12039.0, 2008.0, 589.0, 244.0, 153.0, 107.0, 70.0, 48.0, 33.0, 25.0, 15.0, 29.0, 6.0, 6.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5703125, -2.496856689453125, -2.42340087890625, -2.349945068359375, -2.2764892578125, -2.203033447265625, -2.12957763671875, -2.056121826171875, -1.982666015625, -1.909210205078125, -1.83575439453125, -1.762298583984375, -1.6888427734375, -1.615386962890625, -1.54193115234375, -1.468475341796875, -1.39501953125, -1.321563720703125, -1.24810791015625, -1.174652099609375, -1.1011962890625, -1.027740478515625, -0.95428466796875, -0.880828857421875, -0.807373046875, -0.733917236328125, -0.66046142578125, -0.587005615234375, -0.5135498046875, -0.440093994140625, -0.36663818359375, -0.293182373046875, -0.2197265625, -0.146270751953125, -0.07281494140625, 0.000640869140625, 0.0740966796875, 0.147552490234375, 0.22100830078125, 0.294464111328125, 0.367919921875, 0.441375732421875, 0.51483154296875, 0.588287353515625, 0.6617431640625, 0.735198974609375, 0.80865478515625, 0.882110595703125, 0.95556640625, 1.029022216796875, 1.10247802734375, 1.175933837890625, 1.2493896484375, 1.322845458984375, 1.39630126953125, 1.469757080078125, 1.543212890625, 1.616668701171875, 1.69012451171875, 1.763580322265625, 1.8370361328125, 1.910491943359375, 1.98394775390625, 2.057403564453125, 2.130859375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 13.0, 8.0, 26.0, 111.0, 324.0, 342.0, 115.0, 31.0, 20.0, 15.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.263671875, -3.1678466796875, -3.072021484375, -2.9761962890625, -2.88037109375, -2.7845458984375, -2.688720703125, -2.5928955078125, -2.4970703125, -2.4012451171875, -2.305419921875, -2.2095947265625, -2.11376953125, -2.0179443359375, -1.922119140625, -1.8262939453125, -1.73046875, -1.6346435546875, -1.538818359375, -1.4429931640625, -1.34716796875, -1.2513427734375, -1.155517578125, -1.0596923828125, -0.9638671875, -0.8680419921875, -0.772216796875, -0.6763916015625, -0.58056640625, -0.4847412109375, -0.388916015625, -0.2930908203125, -0.197265625, -0.1014404296875, -0.005615234375, 0.0902099609375, 0.18603515625, 0.2818603515625, 0.377685546875, 0.4735107421875, 0.5693359375, 0.6651611328125, 0.760986328125, 0.8568115234375, 0.95263671875, 1.0484619140625, 1.144287109375, 1.2401123046875, 1.3359375, 1.4317626953125, 1.527587890625, 1.6234130859375, 1.71923828125, 1.8150634765625, 1.910888671875, 2.0067138671875, 2.1025390625, 2.1983642578125, 2.294189453125, 2.3900146484375, 2.48583984375, 2.5816650390625, 2.677490234375, 2.7733154296875, 2.869140625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 8.0, 27.0, 102.0, 198.0, 301.0, 206.0, 83.0, 40.0, 18.0, 7.0, 7.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-32.53203201293945, -31.762920379638672, -30.993806838989258, -30.224695205688477, -29.455581665039062, -28.68647003173828, -27.9173583984375, -27.14824676513672, -26.379133224487305, -25.610021591186523, -24.84090805053711, -24.071796417236328, -23.302684783935547, -22.533571243286133, -21.76445960998535, -20.995346069335938, -20.226234436035156, -19.457122802734375, -18.68800926208496, -17.91889762878418, -17.149784088134766, -16.380672454833984, -15.611560821533203, -14.842448234558105, -14.073335647583008, -13.30422306060791, -12.535110473632812, -11.765998840332031, -10.996886253356934, -10.227773666381836, -9.458662033081055, -8.689549446105957, -7.920438766479492, -7.1513261795043945, -6.382214069366455, -5.613101959228516, -4.843989372253418, -4.07487678527832, -3.305764675140381, -2.5366525650024414, -1.7675399780273438, -0.9984276294708252, -0.22931528091430664, 0.5397970676422119, 1.3089094161987305, 2.078021764755249, 2.8471341133117676, 3.616246223449707, 4.385358810424805, 5.154471397399902, 5.923583507537842, 6.692695617675781, 7.461808204650879, 8.230920791625977, 9.000032424926758, 9.769145011901855, 10.538257598876953, 11.30737018585205, 12.076482772827148, 12.84559440612793, 13.614706993103027, 14.383819580078125, 15.152931213378906, 15.922043800354004, 16.6911563873291]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 5.0, 5.0, 7.0, 8.0, 11.0, 11.0, 8.0, 20.0, 18.0, 12.0, 20.0, 31.0, 32.0, 36.0, 29.0, 43.0, 34.0, 41.0, 44.0, 36.0, 42.0, 38.0, 55.0, 44.0, 38.0, 35.0, 29.0, 38.0, 26.0, 34.0, 29.0, 17.0, 23.0, 16.0, 10.0, 15.0, 13.0, 7.0, 12.0, 11.0, 6.0, 5.0, 5.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.826249122619629, -8.568506240844727, -8.310763359069824, -8.053020477294922, -7.795278072357178, -7.537535190582275, -7.279792785644531, -7.022049903869629, -6.764307022094727, -6.506564140319824, -6.248821258544922, -5.991078853607178, -5.733335971832275, -5.475593090057373, -5.217850685119629, -4.960107803344727, -4.702364921569824, -4.444622039794922, -4.1868791580200195, -3.9291367530822754, -3.671393871307373, -3.4136509895324707, -3.1559083461761475, -2.898165702819824, -2.640422821044922, -2.3826799392700195, -2.1249372959136963, -1.8671945333480835, -1.6094517707824707, -1.351709008216858, -1.0939662456512451, -0.8362234830856323, -0.5784797668457031, -0.32073700428009033, -0.06299424171447754, 0.19474852085113525, 0.45249128341674805, 0.7102340459823608, 0.9679768085479736, 1.2257195711135864, 1.4834623336791992, 1.741205096244812, 1.9989478588104248, 2.256690502166748, 2.5144333839416504, 2.7721762657165527, 3.029918909072876, 3.287661552429199, 3.5454044342041016, 3.803147315979004, 4.060890197753906, 4.31863260269165, 4.576375484466553, 4.834118366241455, 5.091860771179199, 5.349603652954102, 5.607346534729004, 5.865089416503906, 6.122832298278809, 6.380574703216553, 6.638317584991455, 6.896060466766357, 7.153802871704102, 7.411545753479004, 7.669288635253906]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 10.0, 7.0, 7.0, 11.0, 9.0, 20.0, 21.0, 28.0, 54.0, 65.0, 95.0, 130.0, 211.0, 354.0, 642.0, 1289.0, 2981.0, 7963.0, 29932.0, 759884.0, 3340034.0, 35391.0, 8768.0, 3254.0, 1355.0, 694.0, 394.0, 233.0, 151.0, 105.0, 68.0, 25.0, 25.0, 20.0, 11.0, 11.0, 14.0, 1.0, 5.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.314453125, -2.234771728515625, -2.15509033203125, -2.075408935546875, -1.9957275390625, -1.916046142578125, -1.83636474609375, -1.756683349609375, -1.677001953125, -1.597320556640625, -1.51763916015625, -1.437957763671875, -1.3582763671875, -1.278594970703125, -1.19891357421875, -1.119232177734375, -1.03955078125, -0.959869384765625, -0.88018798828125, -0.800506591796875, -0.7208251953125, -0.641143798828125, -0.56146240234375, -0.481781005859375, -0.402099609375, -0.322418212890625, -0.24273681640625, -0.163055419921875, -0.0833740234375, -0.003692626953125, 0.07598876953125, 0.155670166015625, 0.2353515625, 0.315032958984375, 0.39471435546875, 0.474395751953125, 0.5540771484375, 0.633758544921875, 0.71343994140625, 0.793121337890625, 0.872802734375, 0.952484130859375, 1.03216552734375, 1.111846923828125, 1.1915283203125, 1.271209716796875, 1.35089111328125, 1.430572509765625, 1.51025390625, 1.589935302734375, 1.66961669921875, 1.749298095703125, 1.8289794921875, 1.908660888671875, 1.98834228515625, 2.068023681640625, 2.147705078125, 2.227386474609375, 2.30706787109375, 2.386749267578125, 2.4664306640625, 2.546112060546875, 2.62579345703125, 2.705474853515625, 2.78515625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 7.0, 6.0, 7.0, 19.0, 24.0, 29.0, 36.0, 47.0, 57.0, 60.0, 62.0, 80.0, 77.0, 78.0, 72.0, 78.0, 65.0, 52.0, 38.0, 32.0, 25.0, 11.0, 20.0, 10.0, 2.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7216796875, -0.6982269287109375, -0.674774169921875, -0.6513214111328125, -0.62786865234375, -0.6044158935546875, -0.580963134765625, -0.5575103759765625, -0.5340576171875, -0.5106048583984375, -0.487152099609375, -0.4636993408203125, -0.44024658203125, -0.4167938232421875, -0.393341064453125, -0.3698883056640625, -0.346435546875, -0.3229827880859375, -0.299530029296875, -0.2760772705078125, -0.25262451171875, -0.2291717529296875, -0.205718994140625, -0.1822662353515625, -0.1588134765625, -0.1353607177734375, -0.111907958984375, -0.0884552001953125, -0.06500244140625, -0.0415496826171875, -0.018096923828125, 0.0053558349609375, 0.02880859375, 0.0522613525390625, 0.075714111328125, 0.0991668701171875, 0.12261962890625, 0.1460723876953125, 0.169525146484375, 0.1929779052734375, 0.2164306640625, 0.2398834228515625, 0.263336181640625, 0.2867889404296875, 0.31024169921875, 0.3336944580078125, 0.357147216796875, 0.3805999755859375, 0.404052734375, 0.4275054931640625, 0.450958251953125, 0.4744110107421875, 0.49786376953125, 0.5213165283203125, 0.544769287109375, 0.5682220458984375, 0.5916748046875, 0.6151275634765625, 0.638580322265625, 0.6620330810546875, 0.68548583984375, 0.7089385986328125, 0.732391357421875, 0.7558441162109375, 0.779296875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [5.0, 8.0, 16.0, 18.0, 20.0, 38.0, 44.0, 64.0, 67.0, 147.0, 1456.0, 4158182.0, 33413.0, 452.0, 99.0, 65.0, 58.0, 39.0, 40.0, 30.0, 11.0, 11.0, 11.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.15625, -5.634033203125, -5.11181640625, -4.589599609375, -4.0673828125, -3.545166015625, -3.02294921875, -2.500732421875, -1.978515625, -1.456298828125, -0.93408203125, -0.411865234375, 0.1103515625, 0.632568359375, 1.15478515625, 1.677001953125, 2.19921875, 2.721435546875, 3.24365234375, 3.765869140625, 4.2880859375, 4.810302734375, 5.33251953125, 5.854736328125, 6.376953125, 6.899169921875, 7.42138671875, 7.943603515625, 8.4658203125, 8.988037109375, 9.51025390625, 10.032470703125, 10.5546875, 11.076904296875, 11.59912109375, 12.121337890625, 12.6435546875, 13.165771484375, 13.68798828125, 14.210205078125, 14.732421875, 15.254638671875, 15.77685546875, 16.299072265625, 16.8212890625, 17.343505859375, 17.86572265625, 18.387939453125, 18.91015625, 19.432373046875, 19.95458984375, 20.476806640625, 20.9990234375, 21.521240234375, 22.04345703125, 22.565673828125, 23.087890625, 23.610107421875, 24.13232421875, 24.654541015625, 25.1767578125, 25.698974609375, 26.22119140625, 26.743408203125, 27.265625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 15.0, 45.0, 199.0, 3451.0, 292.0, 57.0, 16.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76904296875, -0.6677322387695312, -0.5664215087890625, -0.46511077880859375, -0.363800048828125, -0.26248931884765625, -0.1611785888671875, -0.05986785888671875, 0.04144287109375, 0.14275360107421875, 0.2440643310546875, 0.34537506103515625, 0.446685791015625, 0.5479965209960938, 0.6493072509765625, 0.7506179809570312, 0.8519287109375, 0.9532394409179688, 1.0545501708984375, 1.1558609008789062, 1.257171630859375, 1.3584823608398438, 1.4597930908203125, 1.5611038208007812, 1.66241455078125, 1.7637252807617188, 1.8650360107421875, 1.9663467407226562, 2.067657470703125, 2.1689682006835938, 2.2702789306640625, 2.3715896606445312, 2.472900390625, 2.5742111206054688, 2.6755218505859375, 2.7768325805664062, 2.878143310546875, 2.9794540405273438, 3.0807647705078125, 3.1820755004882812, 3.28338623046875, 3.3846969604492188, 3.4860076904296875, 3.5873184204101562, 3.688629150390625, 3.7899398803710938, 3.8912506103515625, 3.9925613403320312, 4.0938720703125, 4.195182800292969, 4.2964935302734375, 4.397804260253906, 4.499114990234375, 4.600425720214844, 4.7017364501953125, 4.803047180175781, 4.90435791015625, 5.005668640136719, 5.1069793701171875, 5.208290100097656, 5.309600830078125, 5.410911560058594, 5.5122222900390625, 5.613533020019531, 5.71484375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 14.0, 32.0, 86.0, 211.0, 301.0, 172.0, 88.0, 37.0, 15.0, 13.0, 4.0, 6.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.004982948303223, -8.69827651977539, -8.391570091247559, -8.084863662719727, -7.778156757354736, -7.471450328826904, -7.164743423461914, -6.858036994934082, -6.55133056640625, -6.244624137878418, -5.937917709350586, -5.631210803985596, -5.324504375457764, -5.017797946929932, -4.711091041564941, -4.404384613037109, -4.097678184509277, -3.7909717559814453, -3.484265089035034, -3.177558422088623, -2.870851993560791, -2.564145565032959, -2.257438898086548, -1.9507322311401367, -1.6440258026123047, -1.337319254875183, -1.0306127071380615, -0.7239061594009399, -0.41719961166381836, -0.11049306392669678, 0.1962134838104248, 0.5029201507568359, 0.8096256256103516, 1.1163321733474731, 1.4230387210845947, 1.7297452688217163, 2.036451816558838, 2.34315824508667, 2.649864912033081, 2.956571578979492, 3.263278007507324, 3.5699844360351562, 3.8766911029815674, 4.1833977699279785, 4.4901041984558105, 4.796810626983643, 5.103517532348633, 5.410223960876465, 5.716930389404297, 6.023636817932129, 6.330343246459961, 6.637050151824951, 6.943756580352783, 7.250463008880615, 7.5571699142456055, 7.8638763427734375, 8.17058277130127, 8.477289199829102, 8.783995628356934, 9.090702056884766, 9.397409439086914, 9.704115867614746, 10.010822296142578, 10.31752872467041, 10.624235153198242]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 9.0, 11.0, 17.0, 31.0, 47.0, 60.0, 96.0, 97.0, 87.0, 130.0, 123.0, 96.0, 63.0, 58.0, 23.0, 10.0, 19.0, 7.0, 5.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.978156089782715, -8.742755889892578, -8.507355690002441, -8.271956443786621, -8.036556243896484, -7.801156044006348, -7.565755844116211, -7.330355644226074, -7.094955921173096, -6.859555721282959, -6.6241559982299805, -6.388755798339844, -6.153355598449707, -5.9179558753967285, -5.682555675506592, -5.447155952453613, -5.211755752563477, -4.97635555267334, -4.740955829620361, -4.505555629730225, -4.270155906677246, -4.034755706787109, -3.7993555068969727, -3.563955545425415, -3.3285555839538574, -3.0931556224823, -2.857755661010742, -2.6223554611206055, -2.386955499649048, -2.1515555381774902, -1.916155457496643, -1.680755376815796, -1.4453554153442383, -1.2099554538726807, -0.9745553731918335, -0.7391553521156311, -0.5037553310394287, -0.2683553695678711, -0.032955288887023926, 0.20244479179382324, 0.43784475326538086, 0.6732447743415833, 0.9086447954177856, 1.1440448760986328, 1.3794448375701904, 1.614844799041748, 1.8502448797225952, 2.0856449604034424, 2.321044921875, 2.5564448833465576, 2.7918448448181152, 3.027245044708252, 3.2626450061798096, 3.498044967651367, 3.733445167541504, 3.9688451290130615, 4.204245090484619, 4.439645290374756, 4.675045013427734, 4.910445213317871, 5.145845413208008, 5.381245136260986, 5.616645336151123, 5.852045059204102, 6.087445259094238]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 8.0, 7.0, 10.0, 9.0, 15.0, 32.0, 54.0, 68.0, 127.0, 255.0, 379.0, 681.0, 1419.0, 3251.0, 8274.0, 27487.0, 120178.0, 507049.0, 294172.0, 59561.0, 15542.0, 5349.0, 2262.0, 1076.0, 528.0, 312.0, 155.0, 97.0, 75.0, 52.0, 24.0, 16.0, 10.0, 8.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.515625, -2.438873291015625, -2.36212158203125, -2.285369873046875, -2.2086181640625, -2.131866455078125, -2.05511474609375, -1.978363037109375, -1.901611328125, -1.824859619140625, -1.74810791015625, -1.671356201171875, -1.5946044921875, -1.517852783203125, -1.44110107421875, -1.364349365234375, -1.28759765625, -1.210845947265625, -1.13409423828125, -1.057342529296875, -0.9805908203125, -0.903839111328125, -0.82708740234375, -0.750335693359375, -0.673583984375, -0.596832275390625, -0.52008056640625, -0.443328857421875, -0.3665771484375, -0.289825439453125, -0.21307373046875, -0.136322021484375, -0.0595703125, 0.017181396484375, 0.09393310546875, 0.170684814453125, 0.2474365234375, 0.324188232421875, 0.40093994140625, 0.477691650390625, 0.554443359375, 0.631195068359375, 0.70794677734375, 0.784698486328125, 0.8614501953125, 0.938201904296875, 1.01495361328125, 1.091705322265625, 1.16845703125, 1.245208740234375, 1.32196044921875, 1.398712158203125, 1.4754638671875, 1.552215576171875, 1.62896728515625, 1.705718994140625, 1.782470703125, 1.859222412109375, 1.93597412109375, 2.012725830078125, 2.0894775390625, 2.166229248046875, 2.24298095703125, 2.319732666015625, 2.396484375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 7.0, 1.0, 8.0, 10.0, 17.0, 14.0, 23.0, 43.0, 39.0, 29.0, 52.0, 58.0, 57.0, 74.0, 76.0, 82.0, 71.0, 55.0, 69.0, 48.0, 49.0, 28.0, 20.0, 21.0, 14.0, 13.0, 11.0, 5.0, 5.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.755859375, -0.7313766479492188, -0.7068939208984375, -0.6824111938476562, -0.657928466796875, -0.6334457397460938, -0.6089630126953125, -0.5844802856445312, -0.55999755859375, -0.5355148315429688, -0.5110321044921875, -0.48654937744140625, -0.462066650390625, -0.43758392333984375, -0.4131011962890625, -0.38861846923828125, -0.3641357421875, -0.33965301513671875, -0.3151702880859375, -0.29068756103515625, -0.266204833984375, -0.24172210693359375, -0.2172393798828125, -0.19275665283203125, -0.16827392578125, -0.14379119873046875, -0.1193084716796875, -0.09482574462890625, -0.070343017578125, -0.04586029052734375, -0.0213775634765625, 0.00310516357421875, 0.027587890625, 0.05207061767578125, 0.0765533447265625, 0.10103607177734375, 0.125518798828125, 0.15000152587890625, 0.1744842529296875, 0.19896697998046875, 0.22344970703125, 0.24793243408203125, 0.2724151611328125, 0.29689788818359375, 0.321380615234375, 0.34586334228515625, 0.3703460693359375, 0.39482879638671875, 0.4193115234375, 0.44379425048828125, 0.4682769775390625, 0.49275970458984375, 0.517242431640625, 0.5417251586914062, 0.5662078857421875, 0.5906906127929688, 0.61517333984375, 0.6396560668945312, 0.6641387939453125, 0.6886215209960938, 0.713104248046875, 0.7375869750976562, 0.7620697021484375, 0.7865524291992188, 0.81103515625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 4.0, 4.0, 5.0, 6.0, 5.0, 7.0, 11.0, 12.0, 25.0, 25.0, 34.0, 48.0, 77.0, 129.0, 212.0, 495.0, 1020.0, 2647.0, 7982.0, 30927.0, 149588.0, 553983.0, 237972.0, 45610.0, 11602.0, 3495.0, 1317.0, 548.0, 307.0, 143.0, 104.0, 68.0, 36.0, 34.0, 20.0, 9.0, 9.0, 11.0, 7.0, 5.0, 3.0, 3.0, 3.0, 8.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.353515625, -2.289276123046875, -2.22503662109375, -2.160797119140625, -2.0965576171875, -2.032318115234375, -1.96807861328125, -1.903839111328125, -1.839599609375, -1.775360107421875, -1.71112060546875, -1.646881103515625, -1.5826416015625, -1.518402099609375, -1.45416259765625, -1.389923095703125, -1.32568359375, -1.261444091796875, -1.19720458984375, -1.132965087890625, -1.0687255859375, -1.004486083984375, -0.94024658203125, -0.876007080078125, -0.811767578125, -0.747528076171875, -0.68328857421875, -0.619049072265625, -0.5548095703125, -0.490570068359375, -0.42633056640625, -0.362091064453125, -0.2978515625, -0.233612060546875, -0.16937255859375, -0.105133056640625, -0.0408935546875, 0.023345947265625, 0.08758544921875, 0.151824951171875, 0.216064453125, 0.280303955078125, 0.34454345703125, 0.408782958984375, 0.4730224609375, 0.537261962890625, 0.60150146484375, 0.665740966796875, 0.72998046875, 0.794219970703125, 0.85845947265625, 0.922698974609375, 0.9869384765625, 1.051177978515625, 1.11541748046875, 1.179656982421875, 1.243896484375, 1.308135986328125, 1.37237548828125, 1.436614990234375, 1.5008544921875, 1.565093994140625, 1.62933349609375, 1.693572998046875, 1.7578125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 6.0, 6.0, 8.0, 13.0, 9.0, 22.0, 25.0, 33.0, 29.0, 32.0, 52.0, 69.0, 53.0, 53.0, 56.0, 47.0, 59.0, 62.0, 40.0, 56.0, 47.0, 47.0, 39.0, 27.0, 26.0, 18.0, 20.0, 9.0, 12.0, 7.0, 13.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.083984375, -3.0080413818359375, -2.932098388671875, -2.8561553955078125, -2.78021240234375, -2.7042694091796875, -2.628326416015625, -2.5523834228515625, -2.4764404296875, -2.4004974365234375, -2.324554443359375, -2.2486114501953125, -2.17266845703125, -2.0967254638671875, -2.020782470703125, -1.9448394775390625, -1.868896484375, -1.7929534912109375, -1.717010498046875, -1.6410675048828125, -1.56512451171875, -1.4891815185546875, -1.413238525390625, -1.3372955322265625, -1.2613525390625, -1.1854095458984375, -1.109466552734375, -1.0335235595703125, -0.95758056640625, -0.8816375732421875, -0.805694580078125, -0.7297515869140625, -0.65380859375, -0.5778656005859375, -0.501922607421875, -0.4259796142578125, -0.35003662109375, -0.2740936279296875, -0.198150634765625, -0.1222076416015625, -0.0462646484375, 0.0296783447265625, 0.105621337890625, 0.1815643310546875, 0.25750732421875, 0.3334503173828125, 0.409393310546875, 0.4853363037109375, 0.561279296875, 0.6372222900390625, 0.713165283203125, 0.7891082763671875, 0.86505126953125, 0.9409942626953125, 1.016937255859375, 1.0928802490234375, 1.1688232421875, 1.2447662353515625, 1.320709228515625, 1.3966522216796875, 1.47259521484375, 1.5485382080078125, 1.624481201171875, 1.7004241943359375, 1.7763671875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 1.0, 6.0, 1.0, 6.0, 6.0, 12.0, 12.0, 14.0, 13.0, 27.0, 42.0, 39.0, 80.0, 142.0, 332.0, 676.0, 1652.0, 5202.0, 23753.0, 163964.0, 620137.0, 195502.0, 27823.0, 5874.0, 1781.0, 714.0, 326.0, 145.0, 98.0, 51.0, 39.0, 20.0, 16.0, 15.0, 10.0, 5.0, 7.0, 3.0, 2.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8759765625, -0.84906005859375, -0.8221435546875, -0.79522705078125, -0.768310546875, -0.74139404296875, -0.7144775390625, -0.68756103515625, -0.66064453125, -0.63372802734375, -0.6068115234375, -0.57989501953125, -0.552978515625, -0.52606201171875, -0.4991455078125, -0.47222900390625, -0.4453125, -0.41839599609375, -0.3914794921875, -0.36456298828125, -0.337646484375, -0.31072998046875, -0.2838134765625, -0.25689697265625, -0.22998046875, -0.20306396484375, -0.1761474609375, -0.14923095703125, -0.122314453125, -0.09539794921875, -0.0684814453125, -0.04156494140625, -0.0146484375, 0.01226806640625, 0.0391845703125, 0.06610107421875, 0.093017578125, 0.11993408203125, 0.1468505859375, 0.17376708984375, 0.20068359375, 0.22760009765625, 0.2545166015625, 0.28143310546875, 0.308349609375, 0.33526611328125, 0.3621826171875, 0.38909912109375, 0.416015625, 0.44293212890625, 0.4698486328125, 0.49676513671875, 0.523681640625, 0.55059814453125, 0.5775146484375, 0.60443115234375, 0.63134765625, 0.65826416015625, 0.6851806640625, 0.71209716796875, 0.739013671875, 0.76593017578125, 0.7928466796875, 0.81976318359375, 0.8466796875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 9.0, 10.0, 13.0, 16.0, 13.0, 32.0, 31.0, 61.0, 66.0, 82.0, 94.0, 120.0, 112.0, 94.0, 78.0, 49.0, 29.0, 23.0, 17.0, 15.0, 9.0, 10.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020265579223632812, -0.00019738450646400452, -0.0001921132206916809, -0.0001868419349193573, -0.0001815706491470337, -0.00017629936337471008, -0.00017102807760238647, -0.00016575679183006287, -0.00016048550605773926, -0.00015521422028541565, -0.00014994293451309204, -0.00014467164874076843, -0.00013940036296844482, -0.00013412907719612122, -0.0001288577914237976, -0.000123586505651474, -0.00011831521987915039, -0.00011304393410682678, -0.00010777264833450317, -0.00010250136256217957, -9.723007678985596e-05, -9.195879101753235e-05, -8.668750524520874e-05, -8.141621947288513e-05, -7.614493370056152e-05, -7.087364792823792e-05, -6.56023621559143e-05, -6.03310763835907e-05, -5.505979061126709e-05, -4.978850483894348e-05, -4.451721906661987e-05, -3.9245933294296265e-05, -3.3974647521972656e-05, -2.8703361749649048e-05, -2.343207597732544e-05, -1.816079020500183e-05, -1.2889504432678223e-05, -7.618218660354614e-06, -2.346932888031006e-06, 2.9243528842926025e-06, 8.195638656616211e-06, 1.346692442893982e-05, 1.8738210201263428e-05, 2.4009495973587036e-05, 2.9280781745910645e-05, 3.455206751823425e-05, 3.982335329055786e-05, 4.509463906288147e-05, 5.036592483520508e-05, 5.5637210607528687e-05, 6.0908496379852295e-05, 6.61797821521759e-05, 7.145106792449951e-05, 7.672235369682312e-05, 8.199363946914673e-05, 8.726492524147034e-05, 9.253621101379395e-05, 9.780749678611755e-05, 0.00010307878255844116, 0.00010835006833076477, 0.00011362135410308838, 0.00011889263987541199, 0.0001241639256477356, 0.0001294352114200592, 0.0001347064971923828]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 4.0, 9.0, 7.0, 9.0, 20.0, 22.0, 44.0, 44.0, 72.0, 108.0, 174.0, 285.0, 496.0, 900.0, 1911.0, 4977.0, 19636.0, 118945.0, 620754.0, 233993.0, 33405.0, 7523.0, 2556.0, 1151.0, 531.0, 364.0, 213.0, 139.0, 80.0, 56.0, 38.0, 19.0, 21.0, 12.0, 8.0, 6.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.85595703125, -0.8280410766601562, -0.8001251220703125, -0.7722091674804688, -0.744293212890625, -0.7163772583007812, -0.6884613037109375, -0.6605453491210938, -0.63262939453125, -0.6047134399414062, -0.5767974853515625, -0.5488815307617188, -0.520965576171875, -0.49304962158203125, -0.4651336669921875, -0.43721771240234375, -0.4093017578125, -0.38138580322265625, -0.3534698486328125, -0.32555389404296875, -0.297637939453125, -0.26972198486328125, -0.2418060302734375, -0.21389007568359375, -0.18597412109375, -0.15805816650390625, -0.1301422119140625, -0.10222625732421875, -0.074310302734375, -0.04639434814453125, -0.0184783935546875, 0.00943756103515625, 0.037353515625, 0.06526947021484375, 0.0931854248046875, 0.12110137939453125, 0.149017333984375, 0.17693328857421875, 0.2048492431640625, 0.23276519775390625, 0.26068115234375, 0.28859710693359375, 0.3165130615234375, 0.34442901611328125, 0.372344970703125, 0.40026092529296875, 0.4281768798828125, 0.45609283447265625, 0.4840087890625, 0.5119247436523438, 0.5398406982421875, 0.5677566528320312, 0.595672607421875, 0.6235885620117188, 0.6515045166015625, 0.6794204711914062, 0.70733642578125, 0.7352523803710938, 0.7631683349609375, 0.7910842895507812, 0.819000244140625, 0.8469161987304688, 0.8748321533203125, 0.9027481079101562, 0.9306640625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 2.0, 5.0, 13.0, 18.0, 29.0, 45.0, 86.0, 129.0, 158.0, 146.0, 137.0, 100.0, 50.0, 21.0, 27.0, 12.0, 7.0, 5.0, 0.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4814453125, -1.444427490234375, -1.40740966796875, -1.370391845703125, -1.3333740234375, -1.296356201171875, -1.25933837890625, -1.222320556640625, -1.185302734375, -1.148284912109375, -1.11126708984375, -1.074249267578125, -1.0372314453125, -1.000213623046875, -0.96319580078125, -0.926177978515625, -0.88916015625, -0.852142333984375, -0.81512451171875, -0.778106689453125, -0.7410888671875, -0.704071044921875, -0.66705322265625, -0.630035400390625, -0.593017578125, -0.555999755859375, -0.51898193359375, -0.481964111328125, -0.4449462890625, -0.407928466796875, -0.37091064453125, -0.333892822265625, -0.296875, -0.259857177734375, -0.22283935546875, -0.185821533203125, -0.1488037109375, -0.111785888671875, -0.07476806640625, -0.037750244140625, -0.000732421875, 0.036285400390625, 0.07330322265625, 0.110321044921875, 0.1473388671875, 0.184356689453125, 0.22137451171875, 0.258392333984375, 0.29541015625, 0.332427978515625, 0.36944580078125, 0.406463623046875, 0.4434814453125, 0.480499267578125, 0.51751708984375, 0.554534912109375, 0.591552734375, 0.628570556640625, 0.66558837890625, 0.702606201171875, 0.7396240234375, 0.776641845703125, 0.81365966796875, 0.850677490234375, 0.8876953125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 16.0, 52.0, 132.0, 270.0, 316.0, 147.0, 45.0, 19.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.400753021240234, -41.51872253417969, -40.636688232421875, -39.75465774536133, -38.872623443603516, -37.99059295654297, -37.108558654785156, -36.22652816772461, -35.3444938659668, -34.46246337890625, -33.58042907714844, -32.69839859008789, -31.816364288330078, -30.9343318939209, -30.05229949951172, -29.170269012451172, -28.288236618041992, -27.406204223632812, -26.524171829223633, -25.642139434814453, -24.760107040405273, -23.878074645996094, -22.996044158935547, -22.114009857177734, -21.231979370117188, -20.349946975708008, -19.467914581298828, -18.58588218688965, -17.70384979248047, -16.82181739807129, -15.939785957336426, -15.057753562927246, -14.175718307495117, -13.293685913085938, -12.411653518676758, -11.529621124267578, -10.647588729858398, -9.765556335449219, -8.883524894714355, -8.001492500305176, -7.119460105895996, -6.237427711486816, -5.355395317077637, -4.473363399505615, -3.5913310050964355, -2.709298610687256, -1.8272666931152344, -0.9452342987060547, -0.063201904296875, 0.8188303709030151, 1.7008626461029053, 2.582894802093506, 3.4649271965026855, 4.346959590911865, 5.228991508483887, 6.111023902893066, 6.993056297302246, 7.875088691711426, 8.757121086120605, 9.639152526855469, 10.521184921264648, 11.403217315673828, 12.285249710083008, 13.167282104492188, 14.049314498901367]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 4.0, 5.0, 12.0, 8.0, 12.0, 14.0, 15.0, 8.0, 23.0, 23.0, 17.0, 25.0, 21.0, 43.0, 37.0, 36.0, 41.0, 46.0, 41.0, 39.0, 43.0, 41.0, 45.0, 43.0, 48.0, 37.0, 46.0, 39.0, 40.0, 25.0, 16.0, 18.0, 20.0, 11.0, 9.0, 9.0, 6.0, 7.0, 3.0, 12.0, 4.0, 3.0, 6.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.691396713256836, -9.39731502532959, -9.103233337402344, -8.809151649475098, -8.515069961547852, -8.220988273620605, -7.926906108856201, -7.632824420928955, -7.338742733001709, -7.044661045074463, -6.750579357147217, -6.456497669219971, -6.162415504455566, -5.86833381652832, -5.574252128601074, -5.280170440673828, -4.986088752746582, -4.692007064819336, -4.39792537689209, -4.103843688964844, -3.8097617626190186, -3.5156800746917725, -3.2215981483459473, -2.927516460418701, -2.633434772491455, -2.339353084564209, -2.045271396636963, -1.7511894702911377, -1.4571077823638916, -1.1630260944366455, -0.8689442873001099, -0.5748624801635742, -0.2807798385620117, 0.01330190896987915, 0.30738365650177, 0.6014654040336609, 0.8955471515655518, 1.1896288394927979, 1.4837106466293335, 1.7777924537658691, 2.0718741416931152, 2.3659558296203613, 2.6600375175476074, 2.9541194438934326, 3.2482011318206787, 3.542282819747925, 3.83636474609375, 4.130446434020996, 4.424528121948242, 4.718609809875488, 5.012691497802734, 5.3067731857299805, 5.600854873657227, 5.894936561584473, 6.189018726348877, 6.483100414276123, 6.777182102203369, 7.071263790130615, 7.365345478057861, 7.659427165985107, 7.953509330749512, 8.247591018676758, 8.541672706604004, 8.83575439453125, 9.129836082458496]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 7.0, 7.0, 14.0, 14.0, 19.0, 29.0, 54.0, 72.0, 125.0, 189.0, 280.0, 573.0, 1022.0, 2400.0, 9090.0, 108452.0, 4040755.0, 23548.0, 4301.0, 1527.0, 801.0, 366.0, 222.0, 129.0, 75.0, 68.0, 37.0, 26.0, 21.0, 17.0, 18.0, 9.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.8046875, -5.62469482421875, -5.4447021484375, -5.26470947265625, -5.084716796875, -4.90472412109375, -4.7247314453125, -4.54473876953125, -4.36474609375, -4.18475341796875, -4.0047607421875, -3.82476806640625, -3.644775390625, -3.46478271484375, -3.2847900390625, -3.10479736328125, -2.9248046875, -2.74481201171875, -2.5648193359375, -2.38482666015625, -2.204833984375, -2.02484130859375, -1.8448486328125, -1.66485595703125, -1.48486328125, -1.30487060546875, -1.1248779296875, -0.94488525390625, -0.764892578125, -0.58489990234375, -0.4049072265625, -0.22491455078125, -0.044921875, 0.13507080078125, 0.3150634765625, 0.49505615234375, 0.675048828125, 0.85504150390625, 1.0350341796875, 1.21502685546875, 1.39501953125, 1.57501220703125, 1.7550048828125, 1.93499755859375, 2.114990234375, 2.29498291015625, 2.4749755859375, 2.65496826171875, 2.8349609375, 3.01495361328125, 3.1949462890625, 3.37493896484375, 3.554931640625, 3.73492431640625, 3.9149169921875, 4.09490966796875, 4.27490234375, 4.45489501953125, 4.6348876953125, 4.81488037109375, 4.994873046875, 5.17486572265625, 5.3548583984375, 5.53485107421875, 5.71484375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 6.0, 8.0, 15.0, 13.0, 12.0, 19.0, 33.0, 31.0, 36.0, 36.0, 42.0, 60.0, 44.0, 61.0, 71.0, 73.0, 74.0, 84.0, 53.0, 38.0, 43.0, 32.0, 32.0, 25.0, 11.0, 10.0, 14.0, 11.0, 10.0, 4.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76708984375, -0.7423629760742188, -0.7176361083984375, -0.6929092407226562, -0.668182373046875, -0.6434555053710938, -0.6187286376953125, -0.5940017700195312, -0.56927490234375, -0.5445480346679688, -0.5198211669921875, -0.49509429931640625, -0.470367431640625, -0.44564056396484375, -0.4209136962890625, -0.39618682861328125, -0.3714599609375, -0.34673309326171875, -0.3220062255859375, -0.29727935791015625, -0.272552490234375, -0.24782562255859375, -0.2230987548828125, -0.19837188720703125, -0.17364501953125, -0.14891815185546875, -0.1241912841796875, -0.09946441650390625, -0.074737548828125, -0.05001068115234375, -0.0252838134765625, -0.00055694580078125, 0.024169921875, 0.04889678955078125, 0.0736236572265625, 0.09835052490234375, 0.123077392578125, 0.14780426025390625, 0.1725311279296875, 0.19725799560546875, 0.22198486328125, 0.24671173095703125, 0.2714385986328125, 0.29616546630859375, 0.320892333984375, 0.34561920166015625, 0.3703460693359375, 0.39507293701171875, 0.4197998046875, 0.44452667236328125, 0.4692535400390625, 0.49398040771484375, 0.518707275390625, 0.5434341430664062, 0.5681610107421875, 0.5928878784179688, 0.61761474609375, 0.6423416137695312, 0.6670684814453125, 0.6917953491210938, 0.716522216796875, 0.7412490844726562, 0.7659759521484375, 0.7907028198242188, 0.8154296875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 7.0, 6.0, 18.0, 24.0, 32.0, 38.0, 60.0, 88.0, 134.0, 206.0, 354.0, 730.0, 2054.0, 8560.0, 90601.0, 4035399.0, 47006.0, 5925.0, 1550.0, 591.0, 299.0, 195.0, 110.0, 97.0, 48.0, 52.0, 24.0, 19.0, 20.0, 15.0, 14.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0546875, -3.89501953125, -3.7353515625, -3.57568359375, -3.416015625, -3.25634765625, -3.0966796875, -2.93701171875, -2.77734375, -2.61767578125, -2.4580078125, -2.29833984375, -2.138671875, -1.97900390625, -1.8193359375, -1.65966796875, -1.5, -1.34033203125, -1.1806640625, -1.02099609375, -0.861328125, -0.70166015625, -0.5419921875, -0.38232421875, -0.22265625, -0.06298828125, 0.0966796875, 0.25634765625, 0.416015625, 0.57568359375, 0.7353515625, 0.89501953125, 1.0546875, 1.21435546875, 1.3740234375, 1.53369140625, 1.693359375, 1.85302734375, 2.0126953125, 2.17236328125, 2.33203125, 2.49169921875, 2.6513671875, 2.81103515625, 2.970703125, 3.13037109375, 3.2900390625, 3.44970703125, 3.609375, 3.76904296875, 3.9287109375, 4.08837890625, 4.248046875, 4.40771484375, 4.5673828125, 4.72705078125, 4.88671875, 5.04638671875, 5.2060546875, 5.36572265625, 5.525390625, 5.68505859375, 5.8447265625, 6.00439453125, 6.1640625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 5.0, 2.0, 3.0, 6.0, 4.0, 9.0, 21.0, 32.0, 43.0, 84.0, 325.0, 3008.0, 328.0, 100.0, 41.0, 25.0, 14.0, 5.0, 9.0, 5.0, 5.0, 6.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.98876953125, -0.9406051635742188, -0.8924407958984375, -0.8442764282226562, -0.796112060546875, -0.7479476928710938, -0.6997833251953125, -0.6516189575195312, -0.60345458984375, -0.5552902221679688, -0.5071258544921875, -0.45896148681640625, -0.410797119140625, -0.36263275146484375, -0.3144683837890625, -0.26630401611328125, -0.2181396484375, -0.16997528076171875, -0.1218109130859375, -0.07364654541015625, -0.025482177734375, 0.02268218994140625, 0.0708465576171875, 0.11901092529296875, 0.16717529296875, 0.21533966064453125, 0.2635040283203125, 0.31166839599609375, 0.359832763671875, 0.40799713134765625, 0.4561614990234375, 0.5043258666992188, 0.552490234375, 0.6006546020507812, 0.6488189697265625, 0.6969833374023438, 0.745147705078125, 0.7933120727539062, 0.8414764404296875, 0.8896408081054688, 0.93780517578125, 0.9859695434570312, 1.0341339111328125, 1.0822982788085938, 1.130462646484375, 1.1786270141601562, 1.2267913818359375, 1.2749557495117188, 1.3231201171875, 1.3712844848632812, 1.4194488525390625, 1.4676132202148438, 1.515777587890625, 1.5639419555664062, 1.6121063232421875, 1.6602706909179688, 1.70843505859375, 1.7565994262695312, 1.8047637939453125, 1.8529281616210938, 1.901092529296875, 1.9492568969726562, 1.9974212646484375, 2.0455856323242188, 2.09375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 6.0, 7.0, 9.0, 27.0, 80.0, 206.0, 292.0, 203.0, 80.0, 39.0, 20.0, 7.0, 6.0, 5.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.679243087768555, -8.42022705078125, -8.161211967468262, -7.902196407318115, -7.643180847167969, -7.384164810180664, -7.125149250030518, -6.866133689880371, -6.607118129730225, -6.348102569580078, -6.089087009429932, -5.830071449279785, -5.5710554122924805, -5.312040328979492, -5.0530242919921875, -4.794008731842041, -4.5349931716918945, -4.275977611541748, -4.016962051391602, -3.757946252822876, -3.4989306926727295, -3.239915132522583, -2.9808993339538574, -2.721883773803711, -2.4628682136535645, -2.203852653503418, -1.944836974143982, -1.685821294784546, -1.4268057346343994, -1.167790174484253, -0.9087744951248169, -0.6497588157653809, -0.39074230194091797, -0.1317266821861267, 0.12728893756866455, 0.3863045573234558, 0.6453201770782471, 0.9043357372283936, 1.1633514165878296, 1.4223670959472656, 1.681382656097412, 1.9403982162475586, 2.199413776397705, 2.4584295749664307, 2.717445135116577, 2.9764606952667236, 3.235476493835449, 3.4944920539855957, 3.753507614135742, 4.012523174285889, 4.271538734436035, 4.530554294586182, 4.789569854736328, 5.048585891723633, 5.307601451873779, 5.566617012023926, 5.825632572174072, 6.084648132324219, 6.343663692474365, 6.602679252624512, 6.861695289611816, 7.120710372924805, 7.379726409912109, 7.638741970062256, 7.897757530212402]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 10.0, 12.0, 11.0, 19.0, 12.0, 26.0, 28.0, 36.0, 29.0, 37.0, 35.0, 50.0, 48.0, 40.0, 41.0, 52.0, 41.0, 54.0, 43.0, 46.0, 41.0, 36.0, 38.0, 42.0, 22.0, 21.0, 22.0, 10.0, 20.0, 11.0, 9.0, 11.0, 8.0, 10.0, 5.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.408156156539917, -2.320138931274414, -2.232121706008911, -2.144104480743408, -2.0560872554779053, -1.9680700302124023, -1.8800526857376099, -1.792035460472107, -1.704018235206604, -1.616001009941101, -1.5279837846755981, -1.4399664402008057, -1.3519492149353027, -1.2639319896697998, -1.1759147644042969, -1.087897539138794, -0.999880313873291, -0.9118630886077881, -0.8238458633422852, -0.7358285784721375, -0.6478113532066345, -0.5597941279411316, -0.4717768430709839, -0.38375961780548096, -0.295742392539978, -0.2077251523733139, -0.11970791220664978, -0.03169065713882446, 0.05632656812667847, 0.1443437933921814, 0.2323610782623291, 0.32037830352783203, 0.40839529037475586, 0.4964125156402588, 0.5844297409057617, 0.6724470257759094, 0.7604642510414124, 0.8484814763069153, 0.936498761177063, 1.024515986442566, 1.1125332117080688, 1.2005504369735718, 1.2885676622390747, 1.3765850067138672, 1.4646022319793701, 1.552619457244873, 1.640636682510376, 1.728653907775879, 1.8166711330413818, 1.9046883583068848, 1.9927055835723877, 2.0807228088378906, 2.1687400341033936, 2.2567572593688965, 2.3447747230529785, 2.4327917098999023, 2.5208091735839844, 2.6088263988494873, 2.6968436241149902, 2.784860849380493, 2.872878074645996, 2.960895299911499, 3.048912525177002, 3.136929988861084, 3.224946975708008]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 8.0, 8.0, 10.0, 13.0, 25.0, 36.0, 51.0, 73.0, 119.0, 149.0, 220.0, 390.0, 632.0, 1085.0, 2112.0, 4044.0, 8314.0, 18033.0, 43638.0, 109973.0, 276326.0, 333333.0, 147849.0, 56918.0, 23745.0, 10456.0, 5033.0, 2569.0, 1329.0, 753.0, 511.0, 289.0, 160.0, 120.0, 75.0, 48.0, 38.0, 20.0, 15.0, 10.0, 11.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.8564453125, -1.8036346435546875, -1.750823974609375, -1.6980133056640625, -1.64520263671875, -1.5923919677734375, -1.539581298828125, -1.4867706298828125, -1.4339599609375, -1.3811492919921875, -1.328338623046875, -1.2755279541015625, -1.22271728515625, -1.1699066162109375, -1.117095947265625, -1.0642852783203125, -1.011474609375, -0.9586639404296875, -0.905853271484375, -0.8530426025390625, -0.80023193359375, -0.7474212646484375, -0.694610595703125, -0.6417999267578125, -0.5889892578125, -0.5361785888671875, -0.483367919921875, -0.4305572509765625, -0.37774658203125, -0.3249359130859375, -0.272125244140625, -0.2193145751953125, -0.16650390625, -0.1136932373046875, -0.060882568359375, -0.0080718994140625, 0.04473876953125, 0.0975494384765625, 0.150360107421875, 0.2031707763671875, 0.2559814453125, 0.3087921142578125, 0.361602783203125, 0.4144134521484375, 0.46722412109375, 0.5200347900390625, 0.572845458984375, 0.6256561279296875, 0.678466796875, 0.7312774658203125, 0.784088134765625, 0.8368988037109375, 0.88970947265625, 0.9425201416015625, 0.995330810546875, 1.0481414794921875, 1.1009521484375, 1.1537628173828125, 1.206573486328125, 1.2593841552734375, 1.31219482421875, 1.3650054931640625, 1.417816162109375, 1.4706268310546875, 1.5234375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 10.0, 13.0, 9.0, 14.0, 18.0, 26.0, 34.0, 27.0, 37.0, 43.0, 60.0, 50.0, 72.0, 64.0, 74.0, 65.0, 55.0, 71.0, 58.0, 36.0, 34.0, 23.0, 25.0, 16.0, 23.0, 11.0, 6.0, 9.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7607421875, -0.7346115112304688, -0.7084808349609375, -0.6823501586914062, -0.656219482421875, -0.6300888061523438, -0.6039581298828125, -0.5778274536132812, -0.55169677734375, -0.5255661010742188, -0.4994354248046875, -0.47330474853515625, -0.447174072265625, -0.42104339599609375, -0.3949127197265625, -0.36878204345703125, -0.3426513671875, -0.31652069091796875, -0.2903900146484375, -0.26425933837890625, -0.238128662109375, -0.21199798583984375, -0.1858673095703125, -0.15973663330078125, -0.13360595703125, -0.10747528076171875, -0.0813446044921875, -0.05521392822265625, -0.029083251953125, -0.00295257568359375, 0.0231781005859375, 0.04930877685546875, 0.075439453125, 0.10157012939453125, 0.1277008056640625, 0.15383148193359375, 0.179962158203125, 0.20609283447265625, 0.2322235107421875, 0.25835418701171875, 0.28448486328125, 0.31061553955078125, 0.3367462158203125, 0.36287689208984375, 0.389007568359375, 0.41513824462890625, 0.4412689208984375, 0.46739959716796875, 0.4935302734375, 0.5196609497070312, 0.5457916259765625, 0.5719223022460938, 0.598052978515625, 0.6241836547851562, 0.6503143310546875, 0.6764450073242188, 0.70257568359375, 0.7287063598632812, 0.7548370361328125, 0.7809677124023438, 0.807098388671875, 0.8332290649414062, 0.8593597412109375, 0.8854904174804688, 0.91162109375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 4.0, 3.0, 6.0, 7.0, 11.0, 17.0, 22.0, 28.0, 59.0, 127.0, 200.0, 416.0, 728.0, 1485.0, 3511.0, 8320.0, 23133.0, 76371.0, 279763.0, 433784.0, 154057.0, 42461.0, 14101.0, 5287.0, 2340.0, 1063.0, 551.0, 290.0, 160.0, 93.0, 53.0, 25.0, 20.0, 19.0, 17.0, 11.0, 3.0, 5.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.529296875, -1.47320556640625, -1.4171142578125, -1.36102294921875, -1.304931640625, -1.24884033203125, -1.1927490234375, -1.13665771484375, -1.08056640625, -1.02447509765625, -0.9683837890625, -0.91229248046875, -0.856201171875, -0.80010986328125, -0.7440185546875, -0.68792724609375, -0.6318359375, -0.57574462890625, -0.5196533203125, -0.46356201171875, -0.407470703125, -0.35137939453125, -0.2952880859375, -0.23919677734375, -0.18310546875, -0.12701416015625, -0.0709228515625, -0.01483154296875, 0.041259765625, 0.09735107421875, 0.1534423828125, 0.20953369140625, 0.265625, 0.32171630859375, 0.3778076171875, 0.43389892578125, 0.489990234375, 0.54608154296875, 0.6021728515625, 0.65826416015625, 0.71435546875, 0.77044677734375, 0.8265380859375, 0.88262939453125, 0.938720703125, 0.99481201171875, 1.0509033203125, 1.10699462890625, 1.1630859375, 1.21917724609375, 1.2752685546875, 1.33135986328125, 1.387451171875, 1.44354248046875, 1.4996337890625, 1.55572509765625, 1.61181640625, 1.66790771484375, 1.7239990234375, 1.78009033203125, 1.836181640625, 1.89227294921875, 1.9483642578125, 2.00445556640625, 2.060546875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 1.0, 3.0, 5.0, 3.0, 6.0, 2.0, 3.0, 5.0, 5.0, 11.0, 10.0, 14.0, 11.0, 20.0, 23.0, 22.0, 22.0, 24.0, 28.0, 32.0, 46.0, 38.0, 55.0, 48.0, 53.0, 39.0, 57.0, 36.0, 49.0, 50.0, 31.0, 33.0, 38.0, 33.0, 23.0, 10.0, 23.0, 19.0, 12.0, 6.0, 11.0, 12.0, 9.0, 6.0, 5.0, 1.0, 1.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.458984375, -2.38092041015625, -2.3028564453125, -2.22479248046875, -2.146728515625, -2.06866455078125, -1.9906005859375, -1.91253662109375, -1.83447265625, -1.75640869140625, -1.6783447265625, -1.60028076171875, -1.522216796875, -1.44415283203125, -1.3660888671875, -1.28802490234375, -1.2099609375, -1.13189697265625, -1.0538330078125, -0.97576904296875, -0.897705078125, -0.81964111328125, -0.7415771484375, -0.66351318359375, -0.58544921875, -0.50738525390625, -0.4293212890625, -0.35125732421875, -0.273193359375, -0.19512939453125, -0.1170654296875, -0.03900146484375, 0.0390625, 0.11712646484375, 0.1951904296875, 0.27325439453125, 0.351318359375, 0.42938232421875, 0.5074462890625, 0.58551025390625, 0.66357421875, 0.74163818359375, 0.8197021484375, 0.89776611328125, 0.975830078125, 1.05389404296875, 1.1319580078125, 1.21002197265625, 1.2880859375, 1.36614990234375, 1.4442138671875, 1.52227783203125, 1.600341796875, 1.67840576171875, 1.7564697265625, 1.83453369140625, 1.91259765625, 1.99066162109375, 2.0687255859375, 2.14678955078125, 2.224853515625, 2.30291748046875, 2.3809814453125, 2.45904541015625, 2.537109375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 9.0, 15.0, 21.0, 36.0, 68.0, 163.0, 440.0, 1511.0, 8782.0, 145186.0, 826755.0, 58880.0, 5050.0, 1029.0, 313.0, 147.0, 62.0, 42.0, 11.0, 11.0, 11.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.359375, -1.3057861328125, -1.252197265625, -1.1986083984375, -1.14501953125, -1.0914306640625, -1.037841796875, -0.9842529296875, -0.9306640625, -0.8770751953125, -0.823486328125, -0.7698974609375, -0.71630859375, -0.6627197265625, -0.609130859375, -0.5555419921875, -0.501953125, -0.4483642578125, -0.394775390625, -0.3411865234375, -0.28759765625, -0.2340087890625, -0.180419921875, -0.1268310546875, -0.0732421875, -0.0196533203125, 0.033935546875, 0.0875244140625, 0.14111328125, 0.1947021484375, 0.248291015625, 0.3018798828125, 0.35546875, 0.4090576171875, 0.462646484375, 0.5162353515625, 0.56982421875, 0.6234130859375, 0.677001953125, 0.7305908203125, 0.7841796875, 0.8377685546875, 0.891357421875, 0.9449462890625, 0.99853515625, 1.0521240234375, 1.105712890625, 1.1593017578125, 1.212890625, 1.2664794921875, 1.320068359375, 1.3736572265625, 1.42724609375, 1.4808349609375, 1.534423828125, 1.5880126953125, 1.6416015625, 1.6951904296875, 1.748779296875, 1.8023681640625, 1.85595703125, 1.9095458984375, 1.963134765625, 2.0167236328125, 2.0703125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 6.0, 3.0, 4.0, 4.0, 3.0, 7.0, 6.0, 7.0, 19.0, 11.0, 13.0, 22.0, 28.0, 41.0, 38.0, 38.0, 45.0, 66.0, 61.0, 75.0, 67.0, 49.0, 69.0, 51.0, 38.0, 47.0, 38.0, 35.0, 10.0, 19.0, 18.0, 12.0, 13.0, 9.0, 11.0, 7.0, 5.0, 4.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.00012683868408203125, -0.00012334156781435013, -0.000119844451546669, -0.00011634733527898788, -0.00011285021901130676, -0.00010935310274362564, -0.00010585598647594452, -0.0001023588702082634, -9.886175394058228e-05, -9.536463767290115e-05, -9.186752140522003e-05, -8.837040513753891e-05, -8.487328886985779e-05, -8.137617260217667e-05, -7.787905633449554e-05, -7.438194006681442e-05, -7.08848237991333e-05, -6.738770753145218e-05, -6.389059126377106e-05, -6.0393474996089935e-05, -5.6896358728408813e-05, -5.339924246072769e-05, -4.990212619304657e-05, -4.640500992536545e-05, -4.2907893657684326e-05, -3.9410777390003204e-05, -3.591366112232208e-05, -3.241654485464096e-05, -2.891942858695984e-05, -2.5422312319278717e-05, -2.1925196051597595e-05, -1.8428079783916473e-05, -1.4930963516235352e-05, -1.143384724855423e-05, -7.936730980873108e-06, -4.439614713191986e-06, -9.424984455108643e-07, 2.5546178221702576e-06, 6.051734089851379e-06, 9.548850357532501e-06, 1.3045966625213623e-05, 1.6543082892894745e-05, 2.0040199160575867e-05, 2.353731542825699e-05, 2.703443169593811e-05, 3.053154796361923e-05, 3.4028664231300354e-05, 3.7525780498981476e-05, 4.10228967666626e-05, 4.452001303434372e-05, 4.801712930202484e-05, 5.151424556970596e-05, 5.5011361837387085e-05, 5.850847810506821e-05, 6.200559437274933e-05, 6.550271064043045e-05, 6.899982690811157e-05, 7.24969431757927e-05, 7.599405944347382e-05, 7.949117571115494e-05, 8.298829197883606e-05, 8.648540824651718e-05, 8.99825245141983e-05, 9.347964078187943e-05, 9.697675704956055e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 10.0, 7.0, 12.0, 9.0, 22.0, 27.0, 60.0, 69.0, 160.0, 263.0, 462.0, 932.0, 2443.0, 9221.0, 55483.0, 438261.0, 465497.0, 60943.0, 9901.0, 2615.0, 1033.0, 463.0, 251.0, 148.0, 92.0, 55.0, 46.0, 28.0, 11.0, 15.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.03515625, -0.9982147216796875, -0.961273193359375, -0.9243316650390625, -0.88739013671875, -0.8504486083984375, -0.813507080078125, -0.7765655517578125, -0.7396240234375, -0.7026824951171875, -0.665740966796875, -0.6287994384765625, -0.59185791015625, -0.5549163818359375, -0.517974853515625, -0.4810333251953125, -0.444091796875, -0.4071502685546875, -0.370208740234375, -0.3332672119140625, -0.29632568359375, -0.2593841552734375, -0.222442626953125, -0.1855010986328125, -0.1485595703125, -0.1116180419921875, -0.074676513671875, -0.0377349853515625, -0.00079345703125, 0.0361480712890625, 0.073089599609375, 0.1100311279296875, 0.14697265625, 0.1839141845703125, 0.220855712890625, 0.2577972412109375, 0.29473876953125, 0.3316802978515625, 0.368621826171875, 0.4055633544921875, 0.4425048828125, 0.4794464111328125, 0.516387939453125, 0.5533294677734375, 0.59027099609375, 0.6272125244140625, 0.664154052734375, 0.7010955810546875, 0.738037109375, 0.7749786376953125, 0.811920166015625, 0.8488616943359375, 0.88580322265625, 0.9227447509765625, 0.959686279296875, 0.9966278076171875, 1.0335693359375, 1.0705108642578125, 1.107452392578125, 1.1443939208984375, 1.18133544921875, 1.2182769775390625, 1.255218505859375, 1.2921600341796875, 1.3291015625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 9.0, 8.0, 11.0, 18.0, 26.0, 34.0, 47.0, 59.0, 85.0, 105.0, 109.0, 113.0, 87.0, 83.0, 55.0, 49.0, 29.0, 24.0, 13.0, 13.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74951171875, -0.7115402221679688, -0.6735687255859375, -0.6355972290039062, -0.597625732421875, -0.5596542358398438, -0.5216827392578125, -0.48371124267578125, -0.44573974609375, -0.40776824951171875, -0.3697967529296875, -0.33182525634765625, -0.293853759765625, -0.25588226318359375, -0.2179107666015625, -0.17993927001953125, -0.1419677734375, -0.10399627685546875, -0.0660247802734375, -0.02805328369140625, 0.009918212890625, 0.04788970947265625, 0.0858612060546875, 0.12383270263671875, 0.16180419921875, 0.19977569580078125, 0.2377471923828125, 0.27571868896484375, 0.313690185546875, 0.35166168212890625, 0.3896331787109375, 0.42760467529296875, 0.465576171875, 0.5035476684570312, 0.5415191650390625, 0.5794906616210938, 0.617462158203125, 0.6554336547851562, 0.6934051513671875, 0.7313766479492188, 0.76934814453125, 0.8073196411132812, 0.8452911376953125, 0.8832626342773438, 0.921234130859375, 0.9592056274414062, 0.9971771240234375, 1.0351486206054688, 1.0731201171875, 1.1110916137695312, 1.1490631103515625, 1.1870346069335938, 1.225006103515625, 1.2629776000976562, 1.3009490966796875, 1.3389205932617188, 1.37689208984375, 1.4148635864257812, 1.4528350830078125, 1.4908065795898438, 1.528778076171875, 1.5667495727539062, 1.6047210693359375, 1.6426925659179688, 1.6806640625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 14.0, 27.0, 70.0, 142.0, 222.0, 226.0, 149.0, 74.0, 35.0, 19.0, 14.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.87394714355469, -38.03001403808594, -37.18607711791992, -36.34214401245117, -35.498207092285156, -34.654273986816406, -33.81033706665039, -32.96640396118164, -32.122467041015625, -31.278532028198242, -30.43459701538086, -29.590662002563477, -28.746726989746094, -27.90279197692871, -27.058856964111328, -26.214923858642578, -25.370988845825195, -24.527053833007812, -23.68311882019043, -22.839183807373047, -21.995248794555664, -21.15131378173828, -20.30738067626953, -19.463443756103516, -18.619510650634766, -17.775575637817383, -16.931640625, -16.087705612182617, -15.243770599365234, -14.399835586547852, -13.555901527404785, -12.711966514587402, -11.868029594421387, -11.024094581604004, -10.180159568786621, -9.336225509643555, -8.492290496826172, -7.648355007171631, -6.804420471191406, -5.960485458374023, -5.116550445556641, -4.272615432739258, -3.428680658340454, -2.5847458839416504, -1.7408108711242676, -0.8968758583068848, -0.052941322326660156, 0.7909936904907227, 1.6349287033081055, 2.4788637161254883, 3.322798490524292, 4.166733264923096, 5.0106682777404785, 5.854603290557861, 6.698537826538086, 7.542472839355469, 8.386407852172852, 9.230342864990234, 10.074277877807617, 10.918212890625, 11.762147903442383, 12.606082916259766, 13.450016975402832, 14.293951988220215, 15.137887001037598]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 6.0, 2.0, 8.0, 7.0, 16.0, 10.0, 16.0, 14.0, 20.0, 18.0, 18.0, 24.0, 33.0, 23.0, 36.0, 25.0, 42.0, 34.0, 31.0, 43.0, 66.0, 37.0, 49.0, 43.0, 34.0, 49.0, 44.0, 28.0, 31.0, 28.0, 26.0, 21.0, 25.0, 22.0, 12.0, 11.0, 13.0, 8.0, 4.0, 7.0, 8.0, 6.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.963959693908691, -13.517277717590332, -13.070594787597656, -12.623912811279297, -12.177230834960938, -11.730547904968262, -11.283865928649902, -10.837182998657227, -10.390501022338867, -9.943819046020508, -9.497136116027832, -9.050454139709473, -8.603771209716797, -8.157089233398438, -7.710407257080078, -7.2637248039245605, -6.817042350769043, -6.370359897613525, -5.923677444458008, -5.476995468139648, -5.030313014984131, -4.583630561828613, -4.136948585510254, -3.6902661323547363, -3.2435836791992188, -2.796901226043701, -2.3502190113067627, -1.9035366773605347, -1.4568543434143066, -1.010171890258789, -0.5634896755218506, -0.11680746078491211, 0.32987403869628906, 0.7765563726425171, 1.2232387065887451, 1.6699210405349731, 2.116603374481201, 2.5632858276367188, 3.0099680423736572, 3.4566502571105957, 3.9033327102661133, 4.350015163421631, 4.796697616577148, 5.243379592895508, 5.690062046051025, 6.136744499206543, 6.583426475524902, 7.03010892868042, 7.4767913818359375, 7.923473834991455, 8.370156288146973, 8.816838264465332, 9.263521194458008, 9.710203170776367, 10.156885147094727, 10.603567123413086, 11.050250053405762, 11.496932029724121, 11.943614959716797, 12.390296936035156, 12.836978912353516, 13.283661842346191, 13.73034381866455, 14.177026748657227, 14.623708724975586]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 12.0, 14.0, 16.0, 33.0, 72.0, 109.0, 218.0, 447.0, 1026.0, 2453.0, 6505.0, 23609.0, 317859.0, 3794804.0, 33538.0, 8261.0, 2872.0, 1225.0, 535.0, 285.0, 154.0, 91.0, 51.0, 27.0, 18.0, 15.0, 16.0, 2.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.958984375, -3.818145751953125, -3.67730712890625, -3.536468505859375, -3.3956298828125, -3.254791259765625, -3.11395263671875, -2.973114013671875, -2.832275390625, -2.691436767578125, -2.55059814453125, -2.409759521484375, -2.2689208984375, -2.128082275390625, -1.98724365234375, -1.846405029296875, -1.70556640625, -1.564727783203125, -1.42388916015625, -1.283050537109375, -1.1422119140625, -1.001373291015625, -0.86053466796875, -0.719696044921875, -0.578857421875, -0.438018798828125, -0.29718017578125, -0.156341552734375, -0.0155029296875, 0.125335693359375, 0.26617431640625, 0.407012939453125, 0.5478515625, 0.688690185546875, 0.82952880859375, 0.970367431640625, 1.1112060546875, 1.252044677734375, 1.39288330078125, 1.533721923828125, 1.674560546875, 1.815399169921875, 1.95623779296875, 2.097076416015625, 2.2379150390625, 2.378753662109375, 2.51959228515625, 2.660430908203125, 2.80126953125, 2.942108154296875, 3.08294677734375, 3.223785400390625, 3.3646240234375, 3.505462646484375, 3.64630126953125, 3.787139892578125, 3.927978515625, 4.068817138671875, 4.20965576171875, 4.350494384765625, 4.4913330078125, 4.632171630859375, 4.77301025390625, 4.913848876953125, 5.0546875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 5.0, 8.0, 7.0, 7.0, 11.0, 10.0, 19.0, 18.0, 29.0, 32.0, 27.0, 36.0, 39.0, 46.0, 54.0, 59.0, 37.0, 49.0, 56.0, 53.0, 48.0, 49.0, 49.0, 38.0, 35.0, 33.0, 31.0, 26.0, 21.0, 14.0, 15.0, 11.0, 8.0, 11.0, 3.0, 3.0, 1.0, 3.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.75830078125, -0.732208251953125, -0.70611572265625, -0.680023193359375, -0.6539306640625, -0.627838134765625, -0.60174560546875, -0.575653076171875, -0.549560546875, -0.523468017578125, -0.49737548828125, -0.471282958984375, -0.4451904296875, -0.419097900390625, -0.39300537109375, -0.366912841796875, -0.3408203125, -0.314727783203125, -0.28863525390625, -0.262542724609375, -0.2364501953125, -0.210357666015625, -0.18426513671875, -0.158172607421875, -0.132080078125, -0.105987548828125, -0.07989501953125, -0.053802490234375, -0.0277099609375, -0.001617431640625, 0.02447509765625, 0.050567626953125, 0.07666015625, 0.102752685546875, 0.12884521484375, 0.154937744140625, 0.1810302734375, 0.207122802734375, 0.23321533203125, 0.259307861328125, 0.285400390625, 0.311492919921875, 0.33758544921875, 0.363677978515625, 0.3897705078125, 0.415863037109375, 0.44195556640625, 0.468048095703125, 0.494140625, 0.520233154296875, 0.54632568359375, 0.572418212890625, 0.5985107421875, 0.624603271484375, 0.65069580078125, 0.676788330078125, 0.702880859375, 0.728973388671875, 0.75506591796875, 0.781158447265625, 0.8072509765625, 0.833343505859375, 0.85943603515625, 0.885528564453125, 0.91162109375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 6.0, 8.0, 4.0, 10.0, 19.0, 16.0, 14.0, 25.0, 30.0, 57.0, 91.0, 131.0, 233.0, 484.0, 1410.0, 8361.0, 165201.0, 3994259.0, 19791.0, 2715.0, 638.0, 299.0, 154.0, 85.0, 62.0, 57.0, 43.0, 22.0, 23.0, 15.0, 4.0, 13.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.09375, -7.84991455078125, -7.6060791015625, -7.36224365234375, -7.118408203125, -6.87457275390625, -6.6307373046875, -6.38690185546875, -6.14306640625, -5.89923095703125, -5.6553955078125, -5.41156005859375, -5.167724609375, -4.92388916015625, -4.6800537109375, -4.43621826171875, -4.1923828125, -3.94854736328125, -3.7047119140625, -3.46087646484375, -3.217041015625, -2.97320556640625, -2.7293701171875, -2.48553466796875, -2.24169921875, -1.99786376953125, -1.7540283203125, -1.51019287109375, -1.266357421875, -1.02252197265625, -0.7786865234375, -0.53485107421875, -0.291015625, -0.04718017578125, 0.1966552734375, 0.44049072265625, 0.684326171875, 0.92816162109375, 1.1719970703125, 1.41583251953125, 1.65966796875, 1.90350341796875, 2.1473388671875, 2.39117431640625, 2.635009765625, 2.87884521484375, 3.1226806640625, 3.36651611328125, 3.6103515625, 3.85418701171875, 4.0980224609375, 4.34185791015625, 4.585693359375, 4.82952880859375, 5.0733642578125, 5.31719970703125, 5.56103515625, 5.80487060546875, 6.0487060546875, 6.29254150390625, 6.536376953125, 6.78021240234375, 7.0240478515625, 7.26788330078125, 7.51171875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 6.0, 14.0, 23.0, 78.0, 398.0, 3370.0, 107.0, 39.0, 18.0, 10.0, 12.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6328125, -6.47943115234375, -6.3260498046875, -6.17266845703125, -6.019287109375, -5.86590576171875, -5.7125244140625, -5.55914306640625, -5.40576171875, -5.25238037109375, -5.0989990234375, -4.94561767578125, -4.792236328125, -4.63885498046875, -4.4854736328125, -4.33209228515625, -4.1787109375, -4.02532958984375, -3.8719482421875, -3.71856689453125, -3.565185546875, -3.41180419921875, -3.2584228515625, -3.10504150390625, -2.95166015625, -2.79827880859375, -2.6448974609375, -2.49151611328125, -2.338134765625, -2.18475341796875, -2.0313720703125, -1.87799072265625, -1.724609375, -1.57122802734375, -1.4178466796875, -1.26446533203125, -1.111083984375, -0.95770263671875, -0.8043212890625, -0.65093994140625, -0.49755859375, -0.34417724609375, -0.1907958984375, -0.03741455078125, 0.115966796875, 0.26934814453125, 0.4227294921875, 0.57611083984375, 0.7294921875, 0.88287353515625, 1.0362548828125, 1.18963623046875, 1.343017578125, 1.49639892578125, 1.6497802734375, 1.80316162109375, 1.95654296875, 2.10992431640625, 2.2633056640625, 2.41668701171875, 2.570068359375, 2.72344970703125, 2.8768310546875, 3.03021240234375, 3.18359375]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 13.0, 12.0, 26.0, 50.0, 127.0, 215.0, 233.0, 162.0, 94.0, 24.0, 20.0, 11.0, 5.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.202736854553223, -13.814584732055664, -13.426431655883789, -13.03827953338623, -12.650127410888672, -12.261974334716797, -11.873822212219238, -11.48567008972168, -11.097517013549805, -10.709364891052246, -10.321211814880371, -9.933059692382812, -9.544907569885254, -9.156755447387695, -8.76860237121582, -8.380450248718262, -7.992298126220703, -7.604145526885986, -7.215993404388428, -6.827840805053711, -6.439688682556152, -6.0515360832214355, -5.663383483886719, -5.27523136138916, -4.887078762054443, -4.498926162719727, -4.110774040222168, -3.722621440887451, -3.3344690799713135, -2.946316719055176, -2.558164119720459, -2.1700117588043213, -1.7818593978881836, -1.393707036972046, -1.0055545568466187, -0.6174020767211914, -0.2292497158050537, 0.15890264511108398, 0.5470552444458008, 0.9352076053619385, 1.3233599662780762, 1.7115123271942139, 2.0996646881103516, 2.4878172874450684, 2.875969648361206, 3.2641220092773438, 3.6522746086120605, 4.040427207946777, 4.428579330444336, 4.816731929779053, 5.204884052276611, 5.593036651611328, 5.981188774108887, 6.3693413734436035, 6.75749397277832, 7.145646095275879, 7.533798694610596, 7.9219512939453125, 8.310103416442871, 8.69825553894043, 9.086408615112305, 9.474560737609863, 9.862712860107422, 10.250865936279297, 10.639018058776855]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 1.0, 3.0, 2.0, 8.0, 6.0, 11.0, 10.0, 13.0, 12.0, 19.0, 16.0, 12.0, 24.0, 22.0, 26.0, 29.0, 32.0, 29.0, 53.0, 41.0, 32.0, 37.0, 30.0, 33.0, 42.0, 40.0, 33.0, 31.0, 36.0, 28.0, 30.0, 26.0, 25.0, 30.0, 22.0, 23.0, 14.0, 20.0, 21.0, 16.0, 7.0, 8.0, 8.0, 6.0, 8.0, 7.0, 5.0, 3.0, 0.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0], "bins": [-4.551063537597656, -4.4028449058532715, -4.254626274108887, -4.106407165527344, -3.958188533782959, -3.809969902038574, -3.6617512702941895, -3.5135326385498047, -3.365313768386841, -3.217095136642456, -3.068876266479492, -2.9206576347351074, -2.7724390029907227, -2.624220132827759, -2.476001501083374, -2.32778263092041, -2.1795639991760254, -2.0313453674316406, -1.8831264972686768, -1.734907865524292, -1.5866891145706177, -1.4384703636169434, -1.2902517318725586, -1.1420329809188843, -0.99381422996521, -0.8455954790115356, -0.6973767876625061, -0.5491580963134766, -0.40093934535980225, -0.25272059440612793, -0.10450190305709839, 0.04371678829193115, 0.19193506240844727, 0.3401537835597992, 0.4883725047111511, 0.6365911960601807, 0.784809947013855, 0.9330286979675293, 1.081247329711914, 1.2294660806655884, 1.3776848316192627, 1.525903582572937, 1.6741223335266113, 1.822340965270996, 1.9705597162246704, 2.1187784671783447, 2.2669970989227295, 2.4152159690856934, 2.563434600830078, 2.711653232574463, 2.8598721027374268, 3.0080907344818115, 3.1563096046447754, 3.30452823638916, 3.452746868133545, 3.6009654998779297, 3.7491843700408936, 3.8974030017852783, 4.045621871948242, 4.193840503692627, 4.342059135437012, 4.490278244018555, 4.6384968757629395, 4.786715507507324, 4.934934139251709]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 4.0, 1.0, 5.0, 11.0, 14.0, 13.0, 30.0, 51.0, 67.0, 110.0, 174.0, 259.0, 499.0, 854.0, 1555.0, 3009.0, 6157.0, 13235.0, 31359.0, 85823.0, 264259.0, 399074.0, 151931.0, 51674.0, 20268.0, 8906.0, 4321.0, 2129.0, 1125.0, 627.0, 370.0, 228.0, 130.0, 80.0, 54.0, 49.0, 32.0, 23.0, 12.0, 17.0, 6.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.68359375, -2.605255126953125, -2.52691650390625, -2.448577880859375, -2.3702392578125, -2.291900634765625, -2.21356201171875, -2.135223388671875, -2.056884765625, -1.978546142578125, -1.90020751953125, -1.821868896484375, -1.7435302734375, -1.665191650390625, -1.58685302734375, -1.508514404296875, -1.43017578125, -1.351837158203125, -1.27349853515625, -1.195159912109375, -1.1168212890625, -1.038482666015625, -0.96014404296875, -0.881805419921875, -0.803466796875, -0.725128173828125, -0.64678955078125, -0.568450927734375, -0.4901123046875, -0.411773681640625, -0.33343505859375, -0.255096435546875, -0.1767578125, -0.098419189453125, -0.02008056640625, 0.058258056640625, 0.1365966796875, 0.214935302734375, 0.29327392578125, 0.371612548828125, 0.449951171875, 0.528289794921875, 0.60662841796875, 0.684967041015625, 0.7633056640625, 0.841644287109375, 0.91998291015625, 0.998321533203125, 1.07666015625, 1.154998779296875, 1.23333740234375, 1.311676025390625, 1.3900146484375, 1.468353271484375, 1.54669189453125, 1.625030517578125, 1.703369140625, 1.781707763671875, 1.86004638671875, 1.938385009765625, 2.0167236328125, 2.095062255859375, 2.17340087890625, 2.251739501953125, 2.330078125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 1.0, 6.0, 6.0, 9.0, 12.0, 9.0, 16.0, 13.0, 19.0, 20.0, 17.0, 13.0, 33.0, 38.0, 30.0, 35.0, 46.0, 39.0, 49.0, 47.0, 42.0, 52.0, 47.0, 44.0, 42.0, 34.0, 40.0, 27.0, 35.0, 33.0, 21.0, 17.0, 14.0, 20.0, 21.0, 10.0, 7.0, 9.0, 9.0, 3.0, 3.0, 2.0, 3.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.73828125, -0.712677001953125, -0.68707275390625, -0.661468505859375, -0.6358642578125, -0.610260009765625, -0.58465576171875, -0.559051513671875, -0.533447265625, -0.507843017578125, -0.48223876953125, -0.456634521484375, -0.4310302734375, -0.405426025390625, -0.37982177734375, -0.354217529296875, -0.32861328125, -0.303009033203125, -0.27740478515625, -0.251800537109375, -0.2261962890625, -0.200592041015625, -0.17498779296875, -0.149383544921875, -0.123779296875, -0.098175048828125, -0.07257080078125, -0.046966552734375, -0.0213623046875, 0.004241943359375, 0.02984619140625, 0.055450439453125, 0.0810546875, 0.106658935546875, 0.13226318359375, 0.157867431640625, 0.1834716796875, 0.209075927734375, 0.23468017578125, 0.260284423828125, 0.285888671875, 0.311492919921875, 0.33709716796875, 0.362701416015625, 0.3883056640625, 0.413909912109375, 0.43951416015625, 0.465118408203125, 0.49072265625, 0.516326904296875, 0.54193115234375, 0.567535400390625, 0.5931396484375, 0.618743896484375, 0.64434814453125, 0.669952392578125, 0.695556640625, 0.721160888671875, 0.74676513671875, 0.772369384765625, 0.7979736328125, 0.823577880859375, 0.84918212890625, 0.874786376953125, 0.900390625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 7.0, 8.0, 2.0, 10.0, 14.0, 14.0, 18.0, 27.0, 46.0, 64.0, 105.0, 166.0, 300.0, 575.0, 1107.0, 2627.0, 7015.0, 21832.0, 91464.0, 513198.0, 328334.0, 57189.0, 15341.0, 5089.0, 2030.0, 908.0, 419.0, 246.0, 120.0, 79.0, 57.0, 48.0, 26.0, 21.0, 14.0, 10.0, 6.0, 8.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.4921875, -3.378997802734375, -3.26580810546875, -3.152618408203125, -3.0394287109375, -2.926239013671875, -2.81304931640625, -2.699859619140625, -2.586669921875, -2.473480224609375, -2.36029052734375, -2.247100830078125, -2.1339111328125, -2.020721435546875, -1.90753173828125, -1.794342041015625, -1.68115234375, -1.567962646484375, -1.45477294921875, -1.341583251953125, -1.2283935546875, -1.115203857421875, -1.00201416015625, -0.888824462890625, -0.775634765625, -0.662445068359375, -0.54925537109375, -0.436065673828125, -0.3228759765625, -0.209686279296875, -0.09649658203125, 0.016693115234375, 0.1298828125, 0.243072509765625, 0.35626220703125, 0.469451904296875, 0.5826416015625, 0.695831298828125, 0.80902099609375, 0.922210693359375, 1.035400390625, 1.148590087890625, 1.26177978515625, 1.374969482421875, 1.4881591796875, 1.601348876953125, 1.71453857421875, 1.827728271484375, 1.94091796875, 2.054107666015625, 2.16729736328125, 2.280487060546875, 2.3936767578125, 2.506866455078125, 2.62005615234375, 2.733245849609375, 2.846435546875, 2.959625244140625, 3.07281494140625, 3.186004638671875, 3.2991943359375, 3.412384033203125, 3.52557373046875, 3.638763427734375, 3.751953125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 2.0, 6.0, 8.0, 10.0, 4.0, 12.0, 19.0, 27.0, 18.0, 22.0, 32.0, 37.0, 40.0, 52.0, 43.0, 44.0, 47.0, 57.0, 56.0, 51.0, 65.0, 52.0, 36.0, 39.0, 45.0, 26.0, 24.0, 22.0, 20.0, 10.0, 22.0, 15.0, 6.0, 6.0, 2.0, 9.0, 5.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.91796875, -5.7501220703125, -5.582275390625, -5.4144287109375, -5.24658203125, -5.0787353515625, -4.910888671875, -4.7430419921875, -4.5751953125, -4.4073486328125, -4.239501953125, -4.0716552734375, -3.90380859375, -3.7359619140625, -3.568115234375, -3.4002685546875, -3.232421875, -3.0645751953125, -2.896728515625, -2.7288818359375, -2.56103515625, -2.3931884765625, -2.225341796875, -2.0574951171875, -1.8896484375, -1.7218017578125, -1.553955078125, -1.3861083984375, -1.21826171875, -1.0504150390625, -0.882568359375, -0.7147216796875, -0.546875, -0.3790283203125, -0.211181640625, -0.0433349609375, 0.12451171875, 0.2923583984375, 0.460205078125, 0.6280517578125, 0.7958984375, 0.9637451171875, 1.131591796875, 1.2994384765625, 1.46728515625, 1.6351318359375, 1.802978515625, 1.9708251953125, 2.138671875, 2.3065185546875, 2.474365234375, 2.6422119140625, 2.81005859375, 2.9779052734375, 3.145751953125, 3.3135986328125, 3.4814453125, 3.6492919921875, 3.817138671875, 3.9849853515625, 4.15283203125, 4.3206787109375, 4.488525390625, 4.6563720703125, 4.82421875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 10.0, 16.0, 33.0, 56.0, 75.0, 186.0, 510.0, 1235.0, 5197.0, 56685.0, 842057.0, 131028.0, 8684.0, 1714.0, 586.0, 261.0, 104.0, 55.0, 23.0, 14.0, 12.0, 10.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.833984375, -2.7606201171875, -2.687255859375, -2.6138916015625, -2.54052734375, -2.4671630859375, -2.393798828125, -2.3204345703125, -2.2470703125, -2.1737060546875, -2.100341796875, -2.0269775390625, -1.95361328125, -1.8802490234375, -1.806884765625, -1.7335205078125, -1.66015625, -1.5867919921875, -1.513427734375, -1.4400634765625, -1.36669921875, -1.2933349609375, -1.219970703125, -1.1466064453125, -1.0732421875, -0.9998779296875, -0.926513671875, -0.8531494140625, -0.77978515625, -0.7064208984375, -0.633056640625, -0.5596923828125, -0.486328125, -0.4129638671875, -0.339599609375, -0.2662353515625, -0.19287109375, -0.1195068359375, -0.046142578125, 0.0272216796875, 0.1005859375, 0.1739501953125, 0.247314453125, 0.3206787109375, 0.39404296875, 0.4674072265625, 0.540771484375, 0.6141357421875, 0.6875, 0.7608642578125, 0.834228515625, 0.9075927734375, 0.98095703125, 1.0543212890625, 1.127685546875, 1.2010498046875, 1.2744140625, 1.3477783203125, 1.421142578125, 1.4945068359375, 1.56787109375, 1.6412353515625, 1.714599609375, 1.7879638671875, 1.861328125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 10.0, 10.0, 12.0, 14.0, 20.0, 26.0, 51.0, 57.0, 81.0, 87.0, 119.0, 98.0, 88.0, 84.0, 68.0, 50.0, 28.0, 33.0, 22.0, 13.0, 6.0, 12.0, 4.0, 5.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002033710479736328, -0.00019684992730617523, -0.00019032880663871765, -0.00018380768597126007, -0.0001772865653038025, -0.0001707654446363449, -0.00016424432396888733, -0.00015772320330142975, -0.00015120208263397217, -0.0001446809619665146, -0.000138159841299057, -0.00013163872063159943, -0.00012511759996414185, -0.00011859647929668427, -0.00011207535862922668, -0.0001055542379617691, -9.903311729431152e-05, -9.251199662685394e-05, -8.599087595939636e-05, -7.946975529193878e-05, -7.29486346244812e-05, -6.642751395702362e-05, -5.990639328956604e-05, -5.338527262210846e-05, -4.686415195465088e-05, -4.03430312871933e-05, -3.382191061973572e-05, -2.7300789952278137e-05, -2.0779669284820557e-05, -1.4258548617362976e-05, -7.737427949905396e-06, -1.216307282447815e-06, 5.304813385009766e-06, 1.1825934052467346e-05, 1.8347054719924927e-05, 2.4868175387382507e-05, 3.138929605484009e-05, 3.791041672229767e-05, 4.443153738975525e-05, 5.095265805721283e-05, 5.747377872467041e-05, 6.399489939212799e-05, 7.051602005958557e-05, 7.703714072704315e-05, 8.355826139450073e-05, 9.007938206195831e-05, 9.66005027294159e-05, 0.00010312162339687347, 0.00010964274406433105, 0.00011616386473178864, 0.00012268498539924622, 0.0001292061060667038, 0.00013572722673416138, 0.00014224834740161896, 0.00014876946806907654, 0.00015529058873653412, 0.0001618117094039917, 0.00016833283007144928, 0.00017485395073890686, 0.00018137507140636444, 0.00018789619207382202, 0.0001944173127412796, 0.00020093843340873718, 0.00020745955407619476, 0.00021398067474365234]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 5.0, 2.0, 9.0, 10.0, 10.0, 19.0, 44.0, 47.0, 65.0, 152.0, 246.0, 823.0, 3832.0, 32939.0, 633989.0, 354246.0, 18465.0, 2558.0, 592.0, 224.0, 103.0, 59.0, 30.0, 39.0, 22.0, 15.0, 10.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9267578125, -1.8550872802734375, -1.783416748046875, -1.7117462158203125, -1.64007568359375, -1.5684051513671875, -1.496734619140625, -1.4250640869140625, -1.3533935546875, -1.2817230224609375, -1.210052490234375, -1.1383819580078125, -1.06671142578125, -0.9950408935546875, -0.923370361328125, -0.8516998291015625, -0.780029296875, -0.7083587646484375, -0.636688232421875, -0.5650177001953125, -0.49334716796875, -0.4216766357421875, -0.350006103515625, -0.2783355712890625, -0.2066650390625, -0.1349945068359375, -0.063323974609375, 0.0083465576171875, 0.08001708984375, 0.1516876220703125, 0.223358154296875, 0.2950286865234375, 0.36669921875, 0.4383697509765625, 0.510040283203125, 0.5817108154296875, 0.65338134765625, 0.7250518798828125, 0.796722412109375, 0.8683929443359375, 0.9400634765625, 1.0117340087890625, 1.083404541015625, 1.1550750732421875, 1.22674560546875, 1.2984161376953125, 1.370086669921875, 1.4417572021484375, 1.513427734375, 1.5850982666015625, 1.656768798828125, 1.7284393310546875, 1.80010986328125, 1.8717803955078125, 1.943450927734375, 2.0151214599609375, 2.0867919921875, 2.1584625244140625, 2.230133056640625, 2.3018035888671875, 2.37347412109375, 2.4451446533203125, 2.516815185546875, 2.5884857177734375, 2.66015625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 12.0, 15.0, 28.0, 59.0, 136.0, 183.0, 221.0, 143.0, 88.0, 47.0, 24.0, 18.0, 10.0, 13.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8359375, -4.7314605712890625, -4.626983642578125, -4.5225067138671875, -4.41802978515625, -4.3135528564453125, -4.209075927734375, -4.1045989990234375, -4.0001220703125, -3.8956451416015625, -3.791168212890625, -3.6866912841796875, -3.58221435546875, -3.4777374267578125, -3.373260498046875, -3.2687835693359375, -3.164306640625, -3.0598297119140625, -2.955352783203125, -2.8508758544921875, -2.74639892578125, -2.6419219970703125, -2.537445068359375, -2.4329681396484375, -2.3284912109375, -2.2240142822265625, -2.119537353515625, -2.0150604248046875, -1.91058349609375, -1.8061065673828125, -1.701629638671875, -1.5971527099609375, -1.49267578125, -1.3881988525390625, -1.283721923828125, -1.1792449951171875, -1.07476806640625, -0.9702911376953125, -0.865814208984375, -0.7613372802734375, -0.6568603515625, -0.5523834228515625, -0.447906494140625, -0.3434295654296875, -0.23895263671875, -0.1344757080078125, -0.029998779296875, 0.0744781494140625, 0.178955078125, 0.2834320068359375, 0.387908935546875, 0.4923858642578125, 0.59686279296875, 0.7013397216796875, 0.805816650390625, 0.9102935791015625, 1.0147705078125, 1.1192474365234375, 1.223724365234375, 1.3282012939453125, 1.43267822265625, 1.5371551513671875, 1.641632080078125, 1.7461090087890625, 1.8505859375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 10.0, 31.0, 112.0, 352.0, 365.0, 95.0, 29.0, 8.0, 4.0, 3.0, 1.0], "bins": [-135.000244140625, -132.6308135986328, -130.26138305664062, -127.89196014404297, -125.52253723144531, -123.15310668945312, -120.78367614746094, -118.41424560546875, -116.0448226928711, -113.6753921508789, -111.30596923828125, -108.93653869628906, -106.56710815429688, -104.19768524169922, -101.82825469970703, -99.45883178710938, -97.08940124511719, -94.719970703125, -92.35054779052734, -89.98111724853516, -87.6116943359375, -85.24226379394531, -82.87283325195312, -80.50340270996094, -78.13397979736328, -75.7645492553711, -73.39512634277344, -71.02569580078125, -68.65626525878906, -66.2868423461914, -63.91741180419922, -61.5479850769043, -59.178550720214844, -56.80912399291992, -54.439697265625, -52.07026672363281, -49.70083999633789, -47.33141326904297, -44.96198272705078, -42.59255599975586, -40.22312927246094, -37.853702545166016, -35.484275817871094, -33.114845275878906, -30.745418548583984, -28.375991821289062, -26.006563186645508, -23.637134552001953, -21.267709732055664, -18.89828109741211, -16.528854370117188, -14.15942668914795, -11.789999008178711, -9.420571327209473, -7.051143646240234, -4.68171501159668, -2.312288284301758, 0.05713939666748047, 2.4265670776367188, 4.795994758605957, 7.165422439575195, 9.534850120544434, 11.904277801513672, 14.273706436157227, 16.64313316345215]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 9.0, 7.0, 6.0, 10.0, 8.0, 10.0, 18.0, 13.0, 27.0, 22.0, 36.0, 49.0, 37.0, 42.0, 40.0, 60.0, 46.0, 36.0, 51.0, 47.0, 50.0, 43.0, 51.0, 42.0, 34.0, 29.0, 24.0, 32.0, 23.0, 17.0, 12.0, 10.0, 15.0, 5.0, 7.0, 5.0, 9.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 3.0], "bins": [-29.18497657775879, -28.389577865600586, -27.594179153442383, -26.79878044128418, -26.003381729125977, -25.207983016967773, -24.412586212158203, -23.6171875, -22.821788787841797, -22.026390075683594, -21.23099136352539, -20.435592651367188, -19.640193939208984, -18.84479522705078, -18.049396514892578, -17.253997802734375, -16.458599090576172, -15.663200378417969, -14.867801666259766, -14.072402954101562, -13.27700424194336, -12.481605529785156, -11.68620777130127, -10.890809059143066, -10.095410346984863, -9.30001163482666, -8.504612922668457, -7.709214687347412, -6.913815975189209, -6.118417263031006, -5.323019027709961, -4.527620315551758, -3.732219696044922, -2.9368209838867188, -2.1414225101470947, -1.3460240364074707, -0.5506253242492676, 0.24477338790893555, 1.0401716232299805, 1.8355703353881836, 2.6309690475463867, 3.42636775970459, 4.221766471862793, 5.017164707183838, 5.812563419342041, 6.607962131500244, 7.403360366821289, 8.198759078979492, 8.994157791137695, 9.789556503295898, 10.584955215454102, 11.380353927612305, 12.175752639770508, 12.971151351928711, 13.766549110412598, 14.5619478225708, 15.357346534729004, 16.15274429321289, 16.948143005371094, 17.743541717529297, 18.5389404296875, 19.334339141845703, 20.129737854003906, 20.92513656616211, 21.720535278320312]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 7.0, 4.0, 9.0, 12.0, 10.0, 12.0, 15.0, 19.0, 22.0, 45.0, 48.0, 69.0, 80.0, 130.0, 151.0, 185.0, 312.0, 451.0, 635.0, 1030.0, 1981.0, 5371.0, 80901.0, 4090127.0, 6942.0, 2237.0, 1146.0, 701.0, 450.0, 284.0, 218.0, 146.0, 131.0, 81.0, 64.0, 45.0, 43.0, 41.0, 20.0, 22.0, 26.0, 7.0, 9.0, 14.0, 11.0, 6.0, 2.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-5.86328125, -5.6746826171875, -5.486083984375, -5.2974853515625, -5.10888671875, -4.9202880859375, -4.731689453125, -4.5430908203125, -4.3544921875, -4.1658935546875, -3.977294921875, -3.7886962890625, -3.60009765625, -3.4114990234375, -3.222900390625, -3.0343017578125, -2.845703125, -2.6571044921875, -2.468505859375, -2.2799072265625, -2.09130859375, -1.9027099609375, -1.714111328125, -1.5255126953125, -1.3369140625, -1.1483154296875, -0.959716796875, -0.7711181640625, -0.58251953125, -0.3939208984375, -0.205322265625, -0.0167236328125, 0.171875, 0.3604736328125, 0.549072265625, 0.7376708984375, 0.92626953125, 1.1148681640625, 1.303466796875, 1.4920654296875, 1.6806640625, 1.8692626953125, 2.057861328125, 2.2464599609375, 2.43505859375, 2.6236572265625, 2.812255859375, 3.0008544921875, 3.189453125, 3.3780517578125, 3.566650390625, 3.7552490234375, 3.94384765625, 4.1324462890625, 4.321044921875, 4.5096435546875, 4.6982421875, 4.8868408203125, 5.075439453125, 5.2640380859375, 5.45263671875, 5.6412353515625, 5.829833984375, 6.0184326171875, 6.20703125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 5.0, 6.0, 6.0, 6.0, 16.0, 9.0, 22.0, 16.0, 25.0, 16.0, 25.0, 33.0, 29.0, 30.0, 33.0, 44.0, 58.0, 52.0, 59.0, 52.0, 37.0, 50.0, 46.0, 43.0, 37.0, 35.0, 31.0, 22.0, 27.0, 17.0, 24.0, 18.0, 17.0, 11.0, 7.0, 9.0, 9.0, 5.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.3125, -1.2762603759765625, -1.240020751953125, -1.2037811279296875, -1.16754150390625, -1.1313018798828125, -1.095062255859375, -1.0588226318359375, -1.0225830078125, -0.9863433837890625, -0.950103759765625, -0.9138641357421875, -0.87762451171875, -0.8413848876953125, -0.805145263671875, -0.7689056396484375, -0.732666015625, -0.6964263916015625, -0.660186767578125, -0.6239471435546875, -0.58770751953125, -0.5514678955078125, -0.515228271484375, -0.4789886474609375, -0.4427490234375, -0.4065093994140625, -0.370269775390625, -0.3340301513671875, -0.29779052734375, -0.2615509033203125, -0.225311279296875, -0.1890716552734375, -0.15283203125, -0.1165924072265625, -0.080352783203125, -0.0441131591796875, -0.00787353515625, 0.0283660888671875, 0.064605712890625, 0.1008453369140625, 0.1370849609375, 0.1733245849609375, 0.209564208984375, 0.2458038330078125, 0.28204345703125, 0.3182830810546875, 0.354522705078125, 0.3907623291015625, 0.427001953125, 0.4632415771484375, 0.499481201171875, 0.5357208251953125, 0.57196044921875, 0.6082000732421875, 0.644439697265625, 0.6806793212890625, 0.7169189453125, 0.7531585693359375, 0.789398193359375, 0.8256378173828125, 0.86187744140625, 0.8981170654296875, 0.934356689453125, 0.9705963134765625, 1.0068359375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 7.0, 9.0, 18.0, 19.0, 22.0, 37.0, 45.0, 92.0, 125.0, 171.0, 225.0, 355.0, 597.0, 980.0, 1710.0, 3937.0, 13490.0, 4120800.0, 40092.0, 5909.0, 2358.0, 1195.0, 716.0, 433.0, 271.0, 206.0, 127.0, 99.0, 79.0, 45.0, 33.0, 24.0, 9.0, 12.0, 7.0, 7.0, 8.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5390625, -6.326171875, -6.11328125, -5.900390625, -5.6875, -5.474609375, -5.26171875, -5.048828125, -4.8359375, -4.623046875, -4.41015625, -4.197265625, -3.984375, -3.771484375, -3.55859375, -3.345703125, -3.1328125, -2.919921875, -2.70703125, -2.494140625, -2.28125, -2.068359375, -1.85546875, -1.642578125, -1.4296875, -1.216796875, -1.00390625, -0.791015625, -0.578125, -0.365234375, -0.15234375, 0.060546875, 0.2734375, 0.486328125, 0.69921875, 0.912109375, 1.125, 1.337890625, 1.55078125, 1.763671875, 1.9765625, 2.189453125, 2.40234375, 2.615234375, 2.828125, 3.041015625, 3.25390625, 3.466796875, 3.6796875, 3.892578125, 4.10546875, 4.318359375, 4.53125, 4.744140625, 4.95703125, 5.169921875, 5.3828125, 5.595703125, 5.80859375, 6.021484375, 6.234375, 6.447265625, 6.66015625, 6.873046875, 7.0859375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 3.0, 9.0, 7.0, 25.0, 220.0, 3772.0, 23.0, 5.0, 5.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9140625, -1.840728759765625, -1.76739501953125, -1.694061279296875, -1.6207275390625, -1.547393798828125, -1.47406005859375, -1.400726318359375, -1.327392578125, -1.254058837890625, -1.18072509765625, -1.107391357421875, -1.0340576171875, -0.960723876953125, -0.88739013671875, -0.814056396484375, -0.74072265625, -0.667388916015625, -0.59405517578125, -0.520721435546875, -0.4473876953125, -0.374053955078125, -0.30072021484375, -0.227386474609375, -0.154052734375, -0.080718994140625, -0.00738525390625, 0.065948486328125, 0.1392822265625, 0.212615966796875, 0.28594970703125, 0.359283447265625, 0.4326171875, 0.505950927734375, 0.57928466796875, 0.652618408203125, 0.7259521484375, 0.799285888671875, 0.87261962890625, 0.945953369140625, 1.019287109375, 1.092620849609375, 1.16595458984375, 1.239288330078125, 1.3126220703125, 1.385955810546875, 1.45928955078125, 1.532623291015625, 1.60595703125, 1.679290771484375, 1.75262451171875, 1.825958251953125, 1.8992919921875, 1.972625732421875, 2.04595947265625, 2.119293212890625, 2.192626953125, 2.265960693359375, 2.33929443359375, 2.412628173828125, 2.4859619140625, 2.559295654296875, 2.63262939453125, 2.705963134765625, 2.779296875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 7.0, 25.0, 31.0, 104.0, 229.0, 320.0, 187.0, 65.0, 25.0, 10.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.578746795654297, -12.330116271972656, -12.0814847946167, -11.832854270935059, -11.584222793579102, -11.335592269897461, -11.08696174621582, -10.838330268859863, -10.589699745178223, -10.341069221496582, -10.092437744140625, -9.843807220458984, -9.595176696777344, -9.346545219421387, -9.097914695739746, -8.849283218383789, -8.600652694702148, -8.352022171020508, -8.10339069366455, -7.85476016998291, -7.606129169464111, -7.3574981689453125, -7.108867645263672, -6.860236644744873, -6.611605644226074, -6.362974643707275, -6.114343643188477, -5.865713119506836, -5.617082118988037, -5.368451118469238, -5.119820594787598, -4.871189594268799, -4.622559070587158, -4.373928070068359, -4.125297546386719, -3.87666654586792, -3.628035545349121, -3.3794045448303223, -3.1307737827301025, -2.882143020629883, -2.633512020111084, -2.384881019592285, -2.1362502574920654, -1.8876193761825562, -1.6389884948730469, -1.3903576135635376, -1.1417267322540283, -0.893095850944519, -0.6444649696350098, -0.3958340883255005, -0.1472032070159912, 0.10142767429351807, 0.35005855560302734, 0.5986894369125366, 0.8473203182220459, 1.0959511995315552, 1.3445820808410645, 1.5932129621505737, 1.841843843460083, 2.0904746055603027, 2.3391056060791016, 2.5877366065979004, 2.83636736869812, 3.08499813079834, 3.3336291313171387]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 9.0, 5.0, 10.0, 6.0, 6.0, 7.0, 12.0, 10.0, 26.0, 22.0, 21.0, 29.0, 36.0, 33.0, 27.0, 33.0, 46.0, 30.0, 38.0, 31.0, 31.0, 38.0, 38.0, 31.0, 35.0, 37.0, 46.0, 42.0, 32.0, 34.0, 31.0, 27.0, 21.0, 15.0, 14.0, 18.0, 11.0, 18.0, 6.0, 8.0, 5.0, 5.0, 2.0, 4.0, 6.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2910361289978027, -2.211760997772217, -2.132485866546631, -2.053210973739624, -1.973935842514038, -1.8946607112884521, -1.8153855800628662, -1.7361104488372803, -1.6568354368209839, -1.577560305595398, -1.4982852935791016, -1.4190101623535156, -1.3397350311279297, -1.2604600191116333, -1.1811848878860474, -1.101909875869751, -1.022634744644165, -0.9433596730232239, -0.8640846014022827, -0.7848094701766968, -0.7055343985557556, -0.6262593269348145, -0.5469841957092285, -0.46770912408828735, -0.3884340524673462, -0.30915898084640503, -0.22988387942314148, -0.15060879290103912, -0.07133370637893677, 0.007941365242004395, 0.08721646666526794, 0.1664915680885315, 0.24576640129089355, 0.3250414729118347, 0.40431657433509827, 0.4835916757583618, 0.562866747379303, 0.6421418190002441, 0.7214169502258301, 0.8006920218467712, 0.8799670934677124, 0.9592421650886536, 1.0385172367095947, 1.1177923679351807, 1.1970674991607666, 1.276342511177063, 1.355617642402649, 1.4348926544189453, 1.5141677856445312, 1.5934429168701172, 1.6727179288864136, 1.7519930601119995, 1.831268072128296, 1.9105432033538818, 1.9898183345794678, 2.0690934658050537, 2.1483683586120605, 2.2276434898376465, 2.3069186210632324, 2.3861935138702393, 2.465468645095825, 2.544743776321411, 2.624018907546997, 2.703294038772583, 2.782569169998169]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 7.0, 5.0, 13.0, 6.0, 13.0, 29.0, 40.0, 56.0, 91.0, 119.0, 187.0, 307.0, 478.0, 766.0, 1209.0, 2062.0, 3585.0, 5972.0, 10755.0, 19510.0, 37664.0, 76723.0, 162339.0, 278060.0, 224192.0, 110897.0, 53395.0, 26482.0, 14264.0, 7930.0, 4593.0, 2653.0, 1532.0, 957.0, 622.0, 361.0, 239.0, 132.0, 79.0, 72.0, 50.0, 33.0, 14.0, 23.0, 21.0, 10.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9501953125, -1.8846282958984375, -1.819061279296875, -1.7534942626953125, -1.68792724609375, -1.6223602294921875, -1.556793212890625, -1.4912261962890625, -1.4256591796875, -1.3600921630859375, -1.294525146484375, -1.2289581298828125, -1.16339111328125, -1.0978240966796875, -1.032257080078125, -0.9666900634765625, -0.901123046875, -0.8355560302734375, -0.769989013671875, -0.7044219970703125, -0.63885498046875, -0.5732879638671875, -0.507720947265625, -0.4421539306640625, -0.3765869140625, -0.3110198974609375, -0.245452880859375, -0.1798858642578125, -0.11431884765625, -0.0487518310546875, 0.016815185546875, 0.0823822021484375, 0.14794921875, 0.2135162353515625, 0.279083251953125, 0.3446502685546875, 0.41021728515625, 0.4757843017578125, 0.541351318359375, 0.6069183349609375, 0.6724853515625, 0.7380523681640625, 0.803619384765625, 0.8691864013671875, 0.93475341796875, 1.0003204345703125, 1.065887451171875, 1.1314544677734375, 1.197021484375, 1.2625885009765625, 1.328155517578125, 1.3937225341796875, 1.45928955078125, 1.5248565673828125, 1.590423583984375, 1.6559906005859375, 1.7215576171875, 1.7871246337890625, 1.852691650390625, 1.9182586669921875, 1.98382568359375, 2.0493927001953125, 2.114959716796875, 2.1805267333984375, 2.24609375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 7.0, 4.0, 7.0, 8.0, 7.0, 14.0, 10.0, 12.0, 10.0, 13.0, 14.0, 21.0, 20.0, 17.0, 18.0, 39.0, 26.0, 18.0, 25.0, 29.0, 38.0, 44.0, 35.0, 48.0, 47.0, 30.0, 39.0, 41.0, 36.0, 38.0, 27.0, 29.0, 31.0, 25.0, 21.0, 22.0, 17.0, 21.0, 15.0, 15.0, 7.0, 11.0, 8.0, 13.0, 7.0, 7.0, 4.0, 1.0, 4.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0], "bins": [-1.169921875, -1.1348724365234375, -1.099822998046875, -1.0647735595703125, -1.02972412109375, -0.9946746826171875, -0.959625244140625, -0.9245758056640625, -0.8895263671875, -0.8544769287109375, -0.819427490234375, -0.7843780517578125, -0.74932861328125, -0.7142791748046875, -0.679229736328125, -0.6441802978515625, -0.609130859375, -0.5740814208984375, -0.539031982421875, -0.5039825439453125, -0.46893310546875, -0.4338836669921875, -0.398834228515625, -0.3637847900390625, -0.3287353515625, -0.2936859130859375, -0.258636474609375, -0.2235870361328125, -0.18853759765625, -0.1534881591796875, -0.118438720703125, -0.0833892822265625, -0.04833984375, -0.0132904052734375, 0.021759033203125, 0.0568084716796875, 0.09185791015625, 0.1269073486328125, 0.161956787109375, 0.1970062255859375, 0.2320556640625, 0.2671051025390625, 0.302154541015625, 0.3372039794921875, 0.37225341796875, 0.4073028564453125, 0.442352294921875, 0.4774017333984375, 0.512451171875, 0.5475006103515625, 0.582550048828125, 0.6175994873046875, 0.65264892578125, 0.6876983642578125, 0.722747802734375, 0.7577972412109375, 0.7928466796875, 0.8278961181640625, 0.862945556640625, 0.8979949951171875, 0.93304443359375, 0.9680938720703125, 1.003143310546875, 1.0381927490234375, 1.0732421875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 1.0, 8.0, 4.0, 5.0, 9.0, 8.0, 11.0, 17.0, 14.0, 27.0, 44.0, 58.0, 70.0, 144.0, 280.0, 742.0, 1835.0, 5348.0, 17945.0, 79735.0, 510146.0, 355407.0, 56112.0, 13753.0, 4110.0, 1448.0, 574.0, 297.0, 124.0, 79.0, 49.0, 34.0, 21.0, 23.0, 15.0, 10.0, 8.0, 14.0, 6.0, 1.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.51953125, -5.356689453125, -5.19384765625, -5.031005859375, -4.8681640625, -4.705322265625, -4.54248046875, -4.379638671875, -4.216796875, -4.053955078125, -3.89111328125, -3.728271484375, -3.5654296875, -3.402587890625, -3.23974609375, -3.076904296875, -2.9140625, -2.751220703125, -2.58837890625, -2.425537109375, -2.2626953125, -2.099853515625, -1.93701171875, -1.774169921875, -1.611328125, -1.448486328125, -1.28564453125, -1.122802734375, -0.9599609375, -0.797119140625, -0.63427734375, -0.471435546875, -0.30859375, -0.145751953125, 0.01708984375, 0.179931640625, 0.3427734375, 0.505615234375, 0.66845703125, 0.831298828125, 0.994140625, 1.156982421875, 1.31982421875, 1.482666015625, 1.6455078125, 1.808349609375, 1.97119140625, 2.134033203125, 2.296875, 2.459716796875, 2.62255859375, 2.785400390625, 2.9482421875, 3.111083984375, 3.27392578125, 3.436767578125, 3.599609375, 3.762451171875, 3.92529296875, 4.088134765625, 4.2509765625, 4.413818359375, 4.57666015625, 4.739501953125, 4.90234375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 8.0, 5.0, 13.0, 8.0, 6.0, 30.0, 23.0, 18.0, 19.0, 25.0, 30.0, 27.0, 47.0, 32.0, 46.0, 48.0, 49.0, 61.0, 50.0, 35.0, 45.0, 42.0, 38.0, 45.0, 37.0, 34.0, 35.0, 31.0, 23.0, 20.0, 14.0, 11.0, 9.0, 4.0, 6.0, 7.0, 4.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.0703125, -7.8135986328125, -7.556884765625, -7.3001708984375, -7.04345703125, -6.7867431640625, -6.530029296875, -6.2733154296875, -6.0166015625, -5.7598876953125, -5.503173828125, -5.2464599609375, -4.98974609375, -4.7330322265625, -4.476318359375, -4.2196044921875, -3.962890625, -3.7061767578125, -3.449462890625, -3.1927490234375, -2.93603515625, -2.6793212890625, -2.422607421875, -2.1658935546875, -1.9091796875, -1.6524658203125, -1.395751953125, -1.1390380859375, -0.88232421875, -0.6256103515625, -0.368896484375, -0.1121826171875, 0.14453125, 0.4012451171875, 0.657958984375, 0.9146728515625, 1.17138671875, 1.4281005859375, 1.684814453125, 1.9415283203125, 2.1982421875, 2.4549560546875, 2.711669921875, 2.9683837890625, 3.22509765625, 3.4818115234375, 3.738525390625, 3.9952392578125, 4.251953125, 4.5086669921875, 4.765380859375, 5.0220947265625, 5.27880859375, 5.5355224609375, 5.792236328125, 6.0489501953125, 6.3056640625, 6.5623779296875, 6.819091796875, 7.0758056640625, 7.33251953125, 7.5892333984375, 7.845947265625, 8.1026611328125, 8.359375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 3.0, 16.0, 20.0, 30.0, 59.0, 110.0, 271.0, 596.0, 2175.0, 12020.0, 560777.0, 458376.0, 10987.0, 2042.0, 601.0, 221.0, 95.0, 71.0, 23.0, 19.0, 11.0, 6.0, 3.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0859375, -4.9520263671875, -4.818115234375, -4.6842041015625, -4.55029296875, -4.4163818359375, -4.282470703125, -4.1485595703125, -4.0146484375, -3.8807373046875, -3.746826171875, -3.6129150390625, -3.47900390625, -3.3450927734375, -3.211181640625, -3.0772705078125, -2.943359375, -2.8094482421875, -2.675537109375, -2.5416259765625, -2.40771484375, -2.2738037109375, -2.139892578125, -2.0059814453125, -1.8720703125, -1.7381591796875, -1.604248046875, -1.4703369140625, -1.33642578125, -1.2025146484375, -1.068603515625, -0.9346923828125, -0.80078125, -0.6668701171875, -0.532958984375, -0.3990478515625, -0.26513671875, -0.1312255859375, 0.002685546875, 0.1365966796875, 0.2705078125, 0.4044189453125, 0.538330078125, 0.6722412109375, 0.80615234375, 0.9400634765625, 1.073974609375, 1.2078857421875, 1.341796875, 1.4757080078125, 1.609619140625, 1.7435302734375, 1.87744140625, 2.0113525390625, 2.145263671875, 2.2791748046875, 2.4130859375, 2.5469970703125, 2.680908203125, 2.8148193359375, 2.94873046875, 3.0826416015625, 3.216552734375, 3.3504638671875, 3.484375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 10.0, 18.0, 29.0, 43.0, 81.0, 119.0, 166.0, 156.0, 140.0, 78.0, 58.0, 36.0, 21.0, 14.0, 11.0, 5.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00042939186096191406, -0.0004164353013038635, -0.000403478741645813, -0.00039052218198776245, -0.0003775656223297119, -0.0003646090626716614, -0.00035165250301361084, -0.0003386959433555603, -0.00032573938369750977, -0.00031278282403945923, -0.0002998262643814087, -0.00028686970472335815, -0.0002739131450653076, -0.0002609565854072571, -0.00024800002574920654, -0.000235043466091156, -0.00022208690643310547, -0.00020913034677505493, -0.0001961737871170044, -0.00018321722745895386, -0.00017026066780090332, -0.00015730410814285278, -0.00014434754848480225, -0.0001313909888267517, -0.00011843442916870117, -0.00010547786951065063, -9.25213098526001e-05, -7.956475019454956e-05, -6.660819053649902e-05, -5.3651630878448486e-05, -4.069507122039795e-05, -2.7738511562347412e-05, -1.4781951904296875e-05, -1.8253922462463379e-06, 1.11311674118042e-05, 2.4087727069854736e-05, 3.7044286727905273e-05, 5.000084638595581e-05, 6.295740604400635e-05, 7.591396570205688e-05, 8.887052536010742e-05, 0.00010182708501815796, 0.0001147836446762085, 0.00012774020433425903, 0.00014069676399230957, 0.0001536533236503601, 0.00016660988330841064, 0.00017956644296646118, 0.00019252300262451172, 0.00020547956228256226, 0.0002184361219406128, 0.00023139268159866333, 0.00024434924125671387, 0.0002573058009147644, 0.00027026236057281494, 0.0002832189202308655, 0.000296175479888916, 0.00030913203954696655, 0.0003220885992050171, 0.0003350451588630676, 0.00034800171852111816, 0.0003609582781791687, 0.00037391483783721924, 0.0003868713974952698, 0.0003998279571533203]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 2.0, 7.0, 16.0, 22.0, 52.0, 124.0, 421.0, 3538.0, 373491.0, 665552.0, 4579.0, 504.0, 116.0, 63.0, 32.0, 14.0, 6.0, 6.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5625, -8.36810302734375, -8.1737060546875, -7.97930908203125, -7.784912109375, -7.59051513671875, -7.3961181640625, -7.20172119140625, -7.00732421875, -6.81292724609375, -6.6185302734375, -6.42413330078125, -6.229736328125, -6.03533935546875, -5.8409423828125, -5.64654541015625, -5.4521484375, -5.25775146484375, -5.0633544921875, -4.86895751953125, -4.674560546875, -4.48016357421875, -4.2857666015625, -4.09136962890625, -3.89697265625, -3.70257568359375, -3.5081787109375, -3.31378173828125, -3.119384765625, -2.92498779296875, -2.7305908203125, -2.53619384765625, -2.341796875, -2.14739990234375, -1.9530029296875, -1.75860595703125, -1.564208984375, -1.36981201171875, -1.1754150390625, -0.98101806640625, -0.78662109375, -0.59222412109375, -0.3978271484375, -0.20343017578125, -0.009033203125, 0.18536376953125, 0.3797607421875, 0.57415771484375, 0.7685546875, 0.96295166015625, 1.1573486328125, 1.35174560546875, 1.546142578125, 1.74053955078125, 1.9349365234375, 2.12933349609375, 2.32373046875, 2.51812744140625, 2.7125244140625, 2.90692138671875, 3.101318359375, 3.29571533203125, 3.4901123046875, 3.68450927734375, 3.87890625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 9.0, 6.0, 12.0, 22.0, 35.0, 55.0, 73.0, 97.0, 159.0, 164.0, 123.0, 78.0, 55.0, 25.0, 20.0, 18.0, 10.0, 10.0, 11.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.40625, -4.29400634765625, -4.1817626953125, -4.06951904296875, -3.957275390625, -3.84503173828125, -3.7327880859375, -3.62054443359375, -3.50830078125, -3.39605712890625, -3.2838134765625, -3.17156982421875, -3.059326171875, -2.94708251953125, -2.8348388671875, -2.72259521484375, -2.6103515625, -2.49810791015625, -2.3858642578125, -2.27362060546875, -2.161376953125, -2.04913330078125, -1.9368896484375, -1.82464599609375, -1.71240234375, -1.60015869140625, -1.4879150390625, -1.37567138671875, -1.263427734375, -1.15118408203125, -1.0389404296875, -0.92669677734375, -0.814453125, -0.70220947265625, -0.5899658203125, -0.47772216796875, -0.365478515625, -0.25323486328125, -0.1409912109375, -0.02874755859375, 0.08349609375, 0.19573974609375, 0.3079833984375, 0.42022705078125, 0.532470703125, 0.64471435546875, 0.7569580078125, 0.86920166015625, 0.9814453125, 1.09368896484375, 1.2059326171875, 1.31817626953125, 1.430419921875, 1.54266357421875, 1.6549072265625, 1.76715087890625, 1.87939453125, 1.99163818359375, 2.1038818359375, 2.21612548828125, 2.328369140625, 2.44061279296875, 2.5528564453125, 2.66510009765625, 2.77734375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 22.0, 53.0, 166.0, 301.0, 277.0, 124.0, 39.0, 15.0, 5.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-139.25750732421875, -136.56764221191406, -133.87777709960938, -131.1879119873047, -128.498046875, -125.80818939208984, -123.11832427978516, -120.42845916748047, -117.73859405517578, -115.0487289428711, -112.3588638305664, -109.66899871826172, -106.97914123535156, -104.28927612304688, -101.59941101074219, -98.9095458984375, -96.21968078613281, -93.52981567382812, -90.83995056152344, -88.15008544921875, -85.46022033691406, -82.7703628540039, -80.08049774169922, -77.39063262939453, -74.70076751708984, -72.01090240478516, -69.32103729248047, -66.63117218017578, -63.94131088256836, -61.25144577026367, -58.56158447265625, -55.87171936035156, -53.18185806274414, -50.49199295043945, -47.80213165283203, -45.112266540527344, -42.422401428222656, -39.73253631591797, -37.04267120361328, -34.35280990600586, -31.662944793701172, -28.973079681396484, -26.28321647644043, -23.593353271484375, -20.903488159179688, -18.213623046875, -15.523759841918945, -12.83389663696289, -10.144031524658203, -7.454167366027832, -4.764303207397461, -2.07443904876709, 0.6154251098632812, 3.3052892684936523, 5.995153427124023, 8.685016632080078, 11.374881744384766, 14.064745903015137, 16.754610061645508, 19.444473266601562, 22.13433837890625, 24.824203491210938, 27.514066696166992, 30.203929901123047, 32.893795013427734]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 5.0, 3.0, 2.0, 6.0, 3.0, 7.0, 11.0, 10.0, 12.0, 15.0, 20.0, 18.0, 13.0, 14.0, 19.0, 34.0, 27.0, 37.0, 32.0, 40.0, 39.0, 53.0, 53.0, 51.0, 46.0, 45.0, 42.0, 45.0, 42.0, 41.0, 25.0, 20.0, 27.0, 14.0, 26.0, 21.0, 16.0, 14.0, 11.0, 7.0, 10.0, 6.0, 6.0, 2.0, 6.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0], "bins": [-41.238563537597656, -40.083614349365234, -38.92866134643555, -37.773712158203125, -36.61875915527344, -35.463809967041016, -34.308860778808594, -33.153907775878906, -31.998958587646484, -30.84400749206543, -29.689056396484375, -28.534107208251953, -27.3791561126709, -26.224205017089844, -25.069255828857422, -23.914304733276367, -22.759353637695312, -21.604402542114258, -20.449451446533203, -19.29450225830078, -18.139551162719727, -16.984600067138672, -15.829649925231934, -14.674699783325195, -13.51974868774414, -12.364797592163086, -11.209847450256348, -10.05489730834961, -8.899946212768555, -7.744995594024658, -6.590044975280762, -5.435094833374023, -4.280147552490234, -3.125196933746338, -1.9702463150024414, -0.8152956962585449, 0.33965492248535156, 1.494605541229248, 2.6495561599731445, 3.804506301879883, 4.9594573974609375, 6.114408016204834, 7.2693586349487305, 8.424308776855469, 9.579259872436523, 10.734210968017578, 11.889161109924316, 13.044111251831055, 14.19906234741211, 15.354013442993164, 16.50896453857422, 17.66391372680664, 18.818864822387695, 19.97381591796875, 21.128765106201172, 22.283716201782227, 23.43866729736328, 24.593618392944336, 25.74856948852539, 26.903518676757812, 28.058469772338867, 29.213420867919922, 30.368370056152344, 31.5233211517334, 32.67827224731445]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 10.0, 10.0, 8.0, 16.0, 11.0, 16.0, 21.0, 21.0, 33.0, 52.0, 72.0, 89.0, 152.0, 242.0, 317.0, 571.0, 805.0, 1619.0, 3540.0, 10514.0, 4018062.0, 142013.0, 8994.0, 3235.0, 1610.0, 797.0, 468.0, 313.0, 192.0, 123.0, 105.0, 58.0, 51.0, 36.0, 24.0, 12.0, 19.0, 10.0, 11.0, 8.0, 7.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0], "bins": [-6.1015625, -5.92181396484375, -5.7420654296875, -5.56231689453125, -5.382568359375, -5.20281982421875, -5.0230712890625, -4.84332275390625, -4.66357421875, -4.48382568359375, -4.3040771484375, -4.12432861328125, -3.944580078125, -3.76483154296875, -3.5850830078125, -3.40533447265625, -3.2255859375, -3.04583740234375, -2.8660888671875, -2.68634033203125, -2.506591796875, -2.32684326171875, -2.1470947265625, -1.96734619140625, -1.78759765625, -1.60784912109375, -1.4281005859375, -1.24835205078125, -1.068603515625, -0.88885498046875, -0.7091064453125, -0.52935791015625, -0.349609375, -0.16986083984375, 0.0098876953125, 0.18963623046875, 0.369384765625, 0.54913330078125, 0.7288818359375, 0.90863037109375, 1.08837890625, 1.26812744140625, 1.4478759765625, 1.62762451171875, 1.807373046875, 1.98712158203125, 2.1668701171875, 2.34661865234375, 2.5263671875, 2.70611572265625, 2.8858642578125, 3.06561279296875, 3.245361328125, 3.42510986328125, 3.6048583984375, 3.78460693359375, 3.96435546875, 4.14410400390625, 4.3238525390625, 4.50360107421875, 4.683349609375, 4.86309814453125, 5.0428466796875, 5.22259521484375, 5.40234375]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 3.0, 10.0, 3.0, 9.0, 5.0, 6.0, 15.0, 12.0, 20.0, 18.0, 25.0, 24.0, 29.0, 30.0, 43.0, 51.0, 46.0, 61.0, 77.0, 54.0, 59.0, 52.0, 55.0, 37.0, 32.0, 50.0, 32.0, 31.0, 25.0, 18.0, 18.0, 15.0, 10.0, 5.0, 9.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.078125, -2.0191497802734375, -1.960174560546875, -1.9011993408203125, -1.84222412109375, -1.7832489013671875, -1.724273681640625, -1.6652984619140625, -1.6063232421875, -1.5473480224609375, -1.488372802734375, -1.4293975830078125, -1.37042236328125, -1.3114471435546875, -1.252471923828125, -1.1934967041015625, -1.134521484375, -1.0755462646484375, -1.016571044921875, -0.9575958251953125, -0.89862060546875, -0.8396453857421875, -0.780670166015625, -0.7216949462890625, -0.6627197265625, -0.6037445068359375, -0.544769287109375, -0.4857940673828125, -0.42681884765625, -0.3678436279296875, -0.308868408203125, -0.2498931884765625, -0.19091796875, -0.1319427490234375, -0.072967529296875, -0.0139923095703125, 0.04498291015625, 0.1039581298828125, 0.162933349609375, 0.2219085693359375, 0.2808837890625, 0.3398590087890625, 0.398834228515625, 0.4578094482421875, 0.51678466796875, 0.5757598876953125, 0.634735107421875, 0.6937103271484375, 0.752685546875, 0.8116607666015625, 0.870635986328125, 0.9296112060546875, 0.98858642578125, 1.0475616455078125, 1.106536865234375, 1.1655120849609375, 1.2244873046875, 1.2834625244140625, 1.342437744140625, 1.4014129638671875, 1.46038818359375, 1.5193634033203125, 1.578338623046875, 1.6373138427734375, 1.6962890625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 6.0, 4.0, 13.0, 9.0, 19.0, 18.0, 22.0, 30.0, 70.0, 76.0, 102.0, 144.0, 196.0, 257.0, 334.0, 505.0, 725.0, 1002.0, 1460.0, 2359.0, 3928.0, 7977.0, 20380.0, 114001.0, 3978647.0, 36551.0, 11564.0, 5215.0, 2839.0, 1766.0, 1204.0, 816.0, 550.0, 378.0, 263.0, 224.0, 164.0, 136.0, 93.0, 66.0, 45.0, 37.0, 20.0, 25.0, 13.0, 10.0, 9.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0], "bins": [-4.05859375, -3.94000244140625, -3.8214111328125, -3.70281982421875, -3.584228515625, -3.46563720703125, -3.3470458984375, -3.22845458984375, -3.10986328125, -2.99127197265625, -2.8726806640625, -2.75408935546875, -2.635498046875, -2.51690673828125, -2.3983154296875, -2.27972412109375, -2.1611328125, -2.04254150390625, -1.9239501953125, -1.80535888671875, -1.686767578125, -1.56817626953125, -1.4495849609375, -1.33099365234375, -1.21240234375, -1.09381103515625, -0.9752197265625, -0.85662841796875, -0.738037109375, -0.61944580078125, -0.5008544921875, -0.38226318359375, -0.263671875, -0.14508056640625, -0.0264892578125, 0.09210205078125, 0.210693359375, 0.32928466796875, 0.4478759765625, 0.56646728515625, 0.68505859375, 0.80364990234375, 0.9222412109375, 1.04083251953125, 1.159423828125, 1.27801513671875, 1.3966064453125, 1.51519775390625, 1.6337890625, 1.75238037109375, 1.8709716796875, 1.98956298828125, 2.108154296875, 2.22674560546875, 2.3453369140625, 2.46392822265625, 2.58251953125, 2.70111083984375, 2.8197021484375, 2.93829345703125, 3.056884765625, 3.17547607421875, 3.2940673828125, 3.41265869140625, 3.53125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 10.0, 15.0, 25.0, 39.0, 133.0, 3691.0, 65.0, 34.0, 17.0, 7.0, 7.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.560546875, -1.5091400146484375, -1.457733154296875, -1.4063262939453125, -1.35491943359375, -1.3035125732421875, -1.252105712890625, -1.2006988525390625, -1.1492919921875, -1.0978851318359375, -1.046478271484375, -0.9950714111328125, -0.94366455078125, -0.8922576904296875, -0.840850830078125, -0.7894439697265625, -0.738037109375, -0.6866302490234375, -0.635223388671875, -0.5838165283203125, -0.53240966796875, -0.4810028076171875, -0.429595947265625, -0.3781890869140625, -0.3267822265625, -0.2753753662109375, -0.223968505859375, -0.1725616455078125, -0.12115478515625, -0.0697479248046875, -0.018341064453125, 0.0330657958984375, 0.08447265625, 0.1358795166015625, 0.187286376953125, 0.2386932373046875, 0.29010009765625, 0.3415069580078125, 0.392913818359375, 0.4443206787109375, 0.4957275390625, 0.5471343994140625, 0.598541259765625, 0.6499481201171875, 0.70135498046875, 0.7527618408203125, 0.804168701171875, 0.8555755615234375, 0.906982421875, 0.9583892822265625, 1.009796142578125, 1.0612030029296875, 1.11260986328125, 1.1640167236328125, 1.215423583984375, 1.2668304443359375, 1.3182373046875, 1.3696441650390625, 1.421051025390625, 1.4724578857421875, 1.52386474609375, 1.5752716064453125, 1.626678466796875, 1.6780853271484375, 1.7294921875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 1.0, 3.0, 6.0, 19.0, 57.0, 138.0, 246.0, 264.0, 167.0, 66.0, 33.0, 10.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0913078784942627, -2.789250373840332, -2.4871928691864014, -2.1851353645324707, -1.8830777406692505, -1.5810202360153198, -1.2789626121520996, -0.976905107498169, -0.6748476028442383, -0.37279006838798523, -0.07073253393173218, 0.23132503032684326, 0.5333825349807739, 0.8354400396347046, 1.1374976634979248, 1.4395551681518555, 1.7416126728057861, 2.043670177459717, 2.3457276821136475, 2.647785186767578, 2.949842929840088, 3.2519001960754395, 3.553957939147949, 3.85601544380188, 4.1580729484558105, 4.46013069152832, 4.762187957763672, 5.064245700836182, 5.366302967071533, 5.668360710144043, 5.9704179763793945, 6.272475719451904, 6.574532508850098, 6.876590251922607, 7.178647518157959, 7.480705261230469, 7.78276252746582, 8.084819793701172, 8.38687801361084, 8.688935279846191, 8.990992546081543, 9.293049812316895, 9.595108032226562, 9.897165298461914, 10.199222564697266, 10.501279830932617, 10.803338050842285, 11.105395317077637, 11.407453536987305, 11.709510803222656, 12.011569023132324, 12.313626289367676, 12.615683555603027, 12.917740821838379, 13.219799041748047, 13.521856307983398, 13.82391357421875, 14.125970840454102, 14.42802906036377, 14.730086326599121, 15.032143592834473, 15.334200859069824, 15.636259078979492, 15.938316345214844, 16.240373611450195]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 2.0, 0.0, 6.0, 7.0, 9.0, 14.0, 12.0, 15.0, 12.0, 17.0, 29.0, 23.0, 36.0, 29.0, 27.0, 41.0, 35.0, 47.0, 33.0, 34.0, 40.0, 46.0, 49.0, 58.0, 23.0, 31.0, 41.0, 39.0, 39.0, 29.0, 24.0, 28.0, 19.0, 21.0, 15.0, 16.0, 19.0, 4.0, 9.0, 5.0, 5.0, 6.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.630786657333374, -2.5462396144866943, -2.4616928100585938, -2.377145767211914, -2.2925987243652344, -2.208051919937134, -2.123504877090454, -2.0389580726623535, -1.9544110298156738, -1.8698641061782837, -1.7853171825408936, -1.7007701396942139, -1.6162232160568237, -1.5316762924194336, -1.447129249572754, -1.3625823259353638, -1.2780354022979736, -1.1934884786605835, -1.1089415550231934, -1.0243945121765137, -0.9398475885391235, -0.8553006649017334, -0.7707536816596985, -0.6862066984176636, -0.6016597747802734, -0.5171128511428833, -0.4325658679008484, -0.34801891446113586, -0.26347196102142334, -0.17892500758171082, -0.09437805414199829, -0.009831070899963379, 0.07471561431884766, 0.15926256775856018, 0.2438095211982727, 0.32835647463798523, 0.41290342807769775, 0.4974503815174103, 0.5819973349571228, 0.6665443181991577, 0.7510912418365479, 0.835638165473938, 0.9201851487159729, 1.0047321319580078, 1.089279055595398, 1.173825979232788, 1.2583730220794678, 1.342919945716858, 1.427466869354248, 1.5120137929916382, 1.5965607166290283, 1.681107759475708, 1.7656546831130981, 1.8502016067504883, 1.934748649597168, 2.0192956924438477, 2.1038424968719482, 2.188389539718628, 2.2729363441467285, 2.357483386993408, 2.442030429840088, 2.5265772342681885, 2.611124277114868, 2.6956710815429688, 2.7802181243896484]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 5.0, 10.0, 9.0, 9.0, 18.0, 26.0, 42.0, 80.0, 106.0, 155.0, 239.0, 362.0, 589.0, 1061.0, 1907.0, 3260.0, 5990.0, 11849.0, 24770.0, 56761.0, 143647.0, 323254.0, 276138.0, 111446.0, 44932.0, 20272.0, 9828.0, 5065.0, 2727.0, 1520.0, 919.0, 552.0, 344.0, 206.0, 129.0, 94.0, 69.0, 42.0, 38.0, 20.0, 20.0, 7.0, 12.0, 5.0, 4.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.474609375, -2.388885498046875, -2.30316162109375, -2.217437744140625, -2.1317138671875, -2.045989990234375, -1.96026611328125, -1.874542236328125, -1.788818359375, -1.703094482421875, -1.61737060546875, -1.531646728515625, -1.4459228515625, -1.360198974609375, -1.27447509765625, -1.188751220703125, -1.10302734375, -1.017303466796875, -0.93157958984375, -0.845855712890625, -0.7601318359375, -0.674407958984375, -0.58868408203125, -0.502960205078125, -0.417236328125, -0.331512451171875, -0.24578857421875, -0.160064697265625, -0.0743408203125, 0.011383056640625, 0.09710693359375, 0.182830810546875, 0.2685546875, 0.354278564453125, 0.44000244140625, 0.525726318359375, 0.6114501953125, 0.697174072265625, 0.78289794921875, 0.868621826171875, 0.954345703125, 1.040069580078125, 1.12579345703125, 1.211517333984375, 1.2972412109375, 1.382965087890625, 1.46868896484375, 1.554412841796875, 1.64013671875, 1.725860595703125, 1.81158447265625, 1.897308349609375, 1.9830322265625, 2.068756103515625, 2.15447998046875, 2.240203857421875, 2.325927734375, 2.411651611328125, 2.49737548828125, 2.583099365234375, 2.6688232421875, 2.754547119140625, 2.84027099609375, 2.925994873046875, 3.01171875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 5.0, 9.0, 9.0, 8.0, 7.0, 16.0, 15.0, 9.0, 20.0, 21.0, 23.0, 20.0, 29.0, 29.0, 42.0, 40.0, 42.0, 56.0, 59.0, 49.0, 60.0, 51.0, 33.0, 47.0, 38.0, 44.0, 37.0, 23.0, 25.0, 22.0, 16.0, 16.0, 15.0, 14.0, 5.0, 7.0, 7.0, 5.0, 5.0, 7.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0], "bins": [-1.84375, -1.791473388671875, -1.73919677734375, -1.686920166015625, -1.6346435546875, -1.582366943359375, -1.53009033203125, -1.477813720703125, -1.425537109375, -1.373260498046875, -1.32098388671875, -1.268707275390625, -1.2164306640625, -1.164154052734375, -1.11187744140625, -1.059600830078125, -1.00732421875, -0.955047607421875, -0.90277099609375, -0.850494384765625, -0.7982177734375, -0.745941162109375, -0.69366455078125, -0.641387939453125, -0.589111328125, -0.536834716796875, -0.48455810546875, -0.432281494140625, -0.3800048828125, -0.327728271484375, -0.27545166015625, -0.223175048828125, -0.1708984375, -0.118621826171875, -0.06634521484375, -0.014068603515625, 0.0382080078125, 0.090484619140625, 0.14276123046875, 0.195037841796875, 0.247314453125, 0.299591064453125, 0.35186767578125, 0.404144287109375, 0.4564208984375, 0.508697509765625, 0.56097412109375, 0.613250732421875, 0.66552734375, 0.717803955078125, 0.77008056640625, 0.822357177734375, 0.8746337890625, 0.926910400390625, 0.97918701171875, 1.031463623046875, 1.083740234375, 1.136016845703125, 1.18829345703125, 1.240570068359375, 1.2928466796875, 1.345123291015625, 1.39739990234375, 1.449676513671875, 1.501953125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 4.0, 2.0, 5.0, 5.0, 9.0, 28.0, 25.0, 34.0, 40.0, 58.0, 106.0, 144.0, 243.0, 417.0, 786.0, 1782.0, 4959.0, 19424.0, 127489.0, 711144.0, 150764.0, 21733.0, 5425.0, 1934.0, 846.0, 429.0, 256.0, 131.0, 111.0, 61.0, 36.0, 28.0, 28.0, 20.0, 6.0, 10.0, 9.0, 6.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.8984375, -6.6864013671875, -6.474365234375, -6.2623291015625, -6.05029296875, -5.8382568359375, -5.626220703125, -5.4141845703125, -5.2021484375, -4.9901123046875, -4.778076171875, -4.5660400390625, -4.35400390625, -4.1419677734375, -3.929931640625, -3.7178955078125, -3.505859375, -3.2938232421875, -3.081787109375, -2.8697509765625, -2.65771484375, -2.4456787109375, -2.233642578125, -2.0216064453125, -1.8095703125, -1.5975341796875, -1.385498046875, -1.1734619140625, -0.96142578125, -0.7493896484375, -0.537353515625, -0.3253173828125, -0.11328125, 0.0987548828125, 0.310791015625, 0.5228271484375, 0.73486328125, 0.9468994140625, 1.158935546875, 1.3709716796875, 1.5830078125, 1.7950439453125, 2.007080078125, 2.2191162109375, 2.43115234375, 2.6431884765625, 2.855224609375, 3.0672607421875, 3.279296875, 3.4913330078125, 3.703369140625, 3.9154052734375, 4.12744140625, 4.3394775390625, 4.551513671875, 4.7635498046875, 4.9755859375, 5.1876220703125, 5.399658203125, 5.6116943359375, 5.82373046875, 6.0357666015625, 6.247802734375, 6.4598388671875, 6.671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 6.0, 7.0, 11.0, 9.0, 23.0, 22.0, 40.0, 46.0, 56.0, 74.0, 72.0, 92.0, 89.0, 98.0, 80.0, 79.0, 59.0, 42.0, 29.0, 24.0, 17.0, 14.0, 8.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.8125, -19.291259765625, -18.77001953125, -18.248779296875, -17.7275390625, -17.206298828125, -16.68505859375, -16.163818359375, -15.642578125, -15.121337890625, -14.60009765625, -14.078857421875, -13.5576171875, -13.036376953125, -12.51513671875, -11.993896484375, -11.47265625, -10.951416015625, -10.43017578125, -9.908935546875, -9.3876953125, -8.866455078125, -8.34521484375, -7.823974609375, -7.302734375, -6.781494140625, -6.26025390625, -5.739013671875, -5.2177734375, -4.696533203125, -4.17529296875, -3.654052734375, -3.1328125, -2.611572265625, -2.09033203125, -1.569091796875, -1.0478515625, -0.526611328125, -0.00537109375, 0.515869140625, 1.037109375, 1.558349609375, 2.07958984375, 2.600830078125, 3.1220703125, 3.643310546875, 4.16455078125, 4.685791015625, 5.20703125, 5.728271484375, 6.24951171875, 6.770751953125, 7.2919921875, 7.813232421875, 8.33447265625, 8.855712890625, 9.376953125, 9.898193359375, 10.41943359375, 10.940673828125, 11.4619140625, 11.983154296875, 12.50439453125, 13.025634765625, 13.546875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 14.0, 12.0, 38.0, 62.0, 163.0, 441.0, 1697.0, 12136.0, 957204.0, 71705.0, 3792.0, 845.0, 234.0, 99.0, 38.0, 15.0, 14.0, 12.0, 2.0, 3.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.1171875, -11.84014892578125, -11.5631103515625, -11.28607177734375, -11.009033203125, -10.73199462890625, -10.4549560546875, -10.17791748046875, -9.90087890625, -9.62384033203125, -9.3468017578125, -9.06976318359375, -8.792724609375, -8.51568603515625, -8.2386474609375, -7.96160888671875, -7.6845703125, -7.40753173828125, -7.1304931640625, -6.85345458984375, -6.576416015625, -6.29937744140625, -6.0223388671875, -5.74530029296875, -5.46826171875, -5.19122314453125, -4.9141845703125, -4.63714599609375, -4.360107421875, -4.08306884765625, -3.8060302734375, -3.52899169921875, -3.251953125, -2.97491455078125, -2.6978759765625, -2.42083740234375, -2.143798828125, -1.86676025390625, -1.5897216796875, -1.31268310546875, -1.03564453125, -0.75860595703125, -0.4815673828125, -0.20452880859375, 0.072509765625, 0.34954833984375, 0.6265869140625, 0.90362548828125, 1.1806640625, 1.45770263671875, 1.7347412109375, 2.01177978515625, 2.288818359375, 2.56585693359375, 2.8428955078125, 3.11993408203125, 3.39697265625, 3.67401123046875, 3.9510498046875, 4.22808837890625, 4.505126953125, 4.78216552734375, 5.0592041015625, 5.33624267578125, 5.61328125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 5.0, 5.0, 2.0, 2.0, 5.0, 11.0, 19.0, 27.0, 27.0, 45.0, 68.0, 131.0, 143.0, 121.0, 125.0, 78.0, 53.0, 43.0, 29.0, 18.0, 10.0, 7.0, 7.0, 5.0, 1.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0005240440368652344, -0.0005106553435325623, -0.0004972666501998901, -0.000483877956867218, -0.0004704892635345459, -0.0004571005702018738, -0.00044371187686920166, -0.00043032318353652954, -0.0004169344902038574, -0.0004035457968711853, -0.0003901571035385132, -0.00037676841020584106, -0.00036337971687316895, -0.0003499910235404968, -0.0003366023302078247, -0.0003232136368751526, -0.00030982494354248047, -0.00029643625020980835, -0.00028304755687713623, -0.0002696588635444641, -0.000256270170211792, -0.00024288147687911987, -0.00022949278354644775, -0.00021610409021377563, -0.00020271539688110352, -0.0001893267035484314, -0.00017593801021575928, -0.00016254931688308716, -0.00014916062355041504, -0.00013577193021774292, -0.0001223832368850708, -0.00010899454355239868, -9.560585021972656e-05, -8.221715688705444e-05, -6.882846355438232e-05, -5.5439770221710205e-05, -4.2051076889038086e-05, -2.8662383556365967e-05, -1.5273690223693848e-05, -1.8849968910217285e-06, 1.150369644165039e-05, 2.489238977432251e-05, 3.828108310699463e-05, 5.166977643966675e-05, 6.505846977233887e-05, 7.844716310501099e-05, 9.18358564376831e-05, 0.00010522454977035522, 0.00011861324310302734, 0.00013200193643569946, 0.00014539062976837158, 0.0001587793231010437, 0.00017216801643371582, 0.00018555670976638794, 0.00019894540309906006, 0.00021233409643173218, 0.0002257227897644043, 0.00023911148309707642, 0.00025250017642974854, 0.00026588886976242065, 0.0002792775630950928, 0.0002926662564277649, 0.000306054949760437, 0.00031944364309310913, 0.00033283233642578125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 5.0, 4.0, 10.0, 11.0, 14.0, 22.0, 31.0, 43.0, 71.0, 154.0, 285.0, 765.0, 3116.0, 26550.0, 960729.0, 50857.0, 4142.0, 1007.0, 351.0, 152.0, 90.0, 56.0, 29.0, 19.0, 14.0, 14.0, 8.0, 4.0, 5.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-8.1328125, -7.937255859375, -7.74169921875, -7.546142578125, -7.3505859375, -7.155029296875, -6.95947265625, -6.763916015625, -6.568359375, -6.372802734375, -6.17724609375, -5.981689453125, -5.7861328125, -5.590576171875, -5.39501953125, -5.199462890625, -5.00390625, -4.808349609375, -4.61279296875, -4.417236328125, -4.2216796875, -4.026123046875, -3.83056640625, -3.635009765625, -3.439453125, -3.243896484375, -3.04833984375, -2.852783203125, -2.6572265625, -2.461669921875, -2.26611328125, -2.070556640625, -1.875, -1.679443359375, -1.48388671875, -1.288330078125, -1.0927734375, -0.897216796875, -0.70166015625, -0.506103515625, -0.310546875, -0.114990234375, 0.08056640625, 0.276123046875, 0.4716796875, 0.667236328125, 0.86279296875, 1.058349609375, 1.25390625, 1.449462890625, 1.64501953125, 1.840576171875, 2.0361328125, 2.231689453125, 2.42724609375, 2.622802734375, 2.818359375, 3.013916015625, 3.20947265625, 3.405029296875, 3.6005859375, 3.796142578125, 3.99169921875, 4.187255859375, 4.3828125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 9.0, 14.0, 13.0, 48.0, 105.0, 186.0, 225.0, 189.0, 112.0, 52.0, 24.0, 8.0, 3.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.109375, -3.8756103515625, -3.641845703125, -3.4080810546875, -3.17431640625, -2.9405517578125, -2.706787109375, -2.4730224609375, -2.2392578125, -2.0054931640625, -1.771728515625, -1.5379638671875, -1.30419921875, -1.0704345703125, -0.836669921875, -0.6029052734375, -0.369140625, -0.1353759765625, 0.098388671875, 0.3321533203125, 0.56591796875, 0.7996826171875, 1.033447265625, 1.2672119140625, 1.5009765625, 1.7347412109375, 1.968505859375, 2.2022705078125, 2.43603515625, 2.6697998046875, 2.903564453125, 3.1373291015625, 3.37109375, 3.6048583984375, 3.838623046875, 4.0723876953125, 4.30615234375, 4.5399169921875, 4.773681640625, 5.0074462890625, 5.2412109375, 5.4749755859375, 5.708740234375, 5.9425048828125, 6.17626953125, 6.4100341796875, 6.643798828125, 6.8775634765625, 7.111328125, 7.3450927734375, 7.578857421875, 7.8126220703125, 8.04638671875, 8.2801513671875, 8.513916015625, 8.7476806640625, 8.9814453125, 9.2152099609375, 9.448974609375, 9.6827392578125, 9.91650390625, 10.1502685546875, 10.384033203125, 10.6177978515625, 10.8515625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 13.0, 23.0, 55.0, 108.0, 223.0, 261.0, 183.0, 72.0, 34.0, 10.0, 6.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.238075256347656, -28.440683364868164, -25.643291473388672, -22.845897674560547, -20.048505783081055, -17.251113891601562, -14.453720092773438, -11.656328201293945, -8.858936309814453, -6.061543941497803, -3.2641515731811523, -0.46675872802734375, 2.3306331634521484, 5.128025054931641, 7.925418853759766, 10.722810745239258, 13.52020263671875, 16.317594528198242, 19.114986419677734, 21.91238021850586, 24.70977210998535, 27.507164001464844, 30.30455780029297, 33.101951599121094, 35.89934158325195, 38.69673538208008, 41.49412536621094, 44.29151916503906, 47.08891296386719, 49.88630294799805, 52.68369674682617, 55.48108673095703, 58.278472900390625, 61.07586669921875, 63.87325668334961, 66.670654296875, 69.4680404663086, 72.26543426513672, 75.06282806396484, 77.86022186279297, 80.65760803222656, 83.45500183105469, 86.25239562988281, 89.04978942871094, 91.84717559814453, 94.64456939697266, 97.44196319580078, 100.2393569946289, 103.03675079345703, 105.83414459228516, 108.63153839111328, 111.42892456054688, 114.226318359375, 117.02371215820312, 119.82110595703125, 122.61849975585938, 125.4158935546875, 128.21328735351562, 131.01068115234375, 133.80807495117188, 136.60546875, 139.40286254882812, 142.20025634765625, 144.9976348876953, 147.79502868652344]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 3.0, 7.0, 5.0, 10.0, 11.0, 21.0, 11.0, 16.0, 19.0, 28.0, 28.0, 34.0, 44.0, 42.0, 45.0, 51.0, 61.0, 55.0, 49.0, 58.0, 44.0, 52.0, 57.0, 42.0, 39.0, 39.0, 26.0, 20.0, 15.0, 21.0, 8.0, 10.0, 7.0, 7.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.71356964111328, -47.18662643432617, -45.65968322753906, -44.13274002075195, -42.605796813964844, -41.078853607177734, -39.551910400390625, -38.024967193603516, -36.498023986816406, -34.9710807800293, -33.44413757324219, -31.917194366455078, -30.39025115966797, -28.86330795288086, -27.33636474609375, -25.80942153930664, -24.28247833251953, -22.755535125732422, -21.228591918945312, -19.701648712158203, -18.174705505371094, -16.647762298583984, -15.120819091796875, -13.593875885009766, -12.066932678222656, -10.539989471435547, -9.013046264648438, -7.486103057861328, -5.959159851074219, -4.432216644287109, -2.9052734375, -1.3783302307128906, 0.14861297607421875, 1.6755561828613281, 3.2024993896484375, 4.729442596435547, 6.256385803222656, 7.783329010009766, 9.310272216796875, 10.837215423583984, 12.364158630371094, 13.891101837158203, 15.418045043945312, 16.944988250732422, 18.47193145751953, 19.99887466430664, 21.52581787109375, 23.05276107788086, 24.57970428466797, 26.106647491455078, 27.633590698242188, 29.160533905029297, 30.687477111816406, 32.214420318603516, 33.741363525390625, 35.268306732177734, 36.795249938964844, 38.32219314575195, 39.84913635253906, 41.37607955932617, 42.90302276611328, 44.42996597290039, 45.9569091796875, 47.48385238647461, 49.01079559326172]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 1.0, 8.0, 11.0, 20.0, 22.0, 41.0, 74.0, 169.0, 364.0, 860.0, 2394.0, 10392.0, 4159645.0, 15449.0, 3023.0, 1058.0, 409.0, 167.0, 82.0, 47.0, 16.0, 12.0, 7.0, 4.0, 2.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.0625, -17.5943603515625, -17.126220703125, -16.6580810546875, -16.18994140625, -15.7218017578125, -15.253662109375, -14.7855224609375, -14.3173828125, -13.8492431640625, -13.381103515625, -12.9129638671875, -12.44482421875, -11.9766845703125, -11.508544921875, -11.0404052734375, -10.572265625, -10.1041259765625, -9.635986328125, -9.1678466796875, -8.69970703125, -8.2315673828125, -7.763427734375, -7.2952880859375, -6.8271484375, -6.3590087890625, -5.890869140625, -5.4227294921875, -4.95458984375, -4.4864501953125, -4.018310546875, -3.5501708984375, -3.08203125, -2.6138916015625, -2.145751953125, -1.6776123046875, -1.20947265625, -0.7413330078125, -0.273193359375, 0.1949462890625, 0.6630859375, 1.1312255859375, 1.599365234375, 2.0675048828125, 2.53564453125, 3.0037841796875, 3.471923828125, 3.9400634765625, 4.408203125, 4.8763427734375, 5.344482421875, 5.8126220703125, 6.28076171875, 6.7489013671875, 7.217041015625, 7.6851806640625, 8.1533203125, 8.6214599609375, 9.089599609375, 9.5577392578125, 10.02587890625, 10.4940185546875, 10.962158203125, 11.4302978515625, 11.8984375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 5.0, 13.0, 14.0, 16.0, 19.0, 22.0, 31.0, 27.0, 38.0, 51.0, 69.0, 74.0, 92.0, 71.0, 86.0, 70.0, 57.0, 43.0, 50.0, 33.0, 19.0, 21.0, 18.0, 14.0, 10.0, 5.0, 12.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.65625, -2.568267822265625, -2.48028564453125, -2.392303466796875, -2.3043212890625, -2.216339111328125, -2.12835693359375, -2.040374755859375, -1.952392578125, -1.864410400390625, -1.77642822265625, -1.688446044921875, -1.6004638671875, -1.512481689453125, -1.42449951171875, -1.336517333984375, -1.24853515625, -1.160552978515625, -1.07257080078125, -0.984588623046875, -0.8966064453125, -0.808624267578125, -0.72064208984375, -0.632659912109375, -0.544677734375, -0.456695556640625, -0.36871337890625, -0.280731201171875, -0.1927490234375, -0.104766845703125, -0.01678466796875, 0.071197509765625, 0.1591796875, 0.247161865234375, 0.33514404296875, 0.423126220703125, 0.5111083984375, 0.599090576171875, 0.68707275390625, 0.775054931640625, 0.863037109375, 0.951019287109375, 1.03900146484375, 1.126983642578125, 1.2149658203125, 1.302947998046875, 1.39093017578125, 1.478912353515625, 1.56689453125, 1.654876708984375, 1.74285888671875, 1.830841064453125, 1.9188232421875, 2.006805419921875, 2.09478759765625, 2.182769775390625, 2.270751953125, 2.358734130859375, 2.44671630859375, 2.534698486328125, 2.6226806640625, 2.710662841796875, 2.79864501953125, 2.886627197265625, 2.974609375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 1.0, 4.0, 6.0, 9.0, 12.0, 8.0, 15.0, 17.0, 23.0, 33.0, 47.0, 68.0, 91.0, 110.0, 198.0, 305.0, 500.0, 822.0, 1434.0, 2977.0, 7489.0, 53257.0, 4101445.0, 16251.0, 4327.0, 1990.0, 1092.0, 605.0, 372.0, 230.0, 157.0, 101.0, 87.0, 54.0, 37.0, 33.0, 17.0, 12.0, 11.0, 4.0, 4.0, 9.0, 8.0, 2.0, 6.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0859375, -8.78564453125, -8.4853515625, -8.18505859375, -7.884765625, -7.58447265625, -7.2841796875, -6.98388671875, -6.68359375, -6.38330078125, -6.0830078125, -5.78271484375, -5.482421875, -5.18212890625, -4.8818359375, -4.58154296875, -4.28125, -3.98095703125, -3.6806640625, -3.38037109375, -3.080078125, -2.77978515625, -2.4794921875, -2.17919921875, -1.87890625, -1.57861328125, -1.2783203125, -0.97802734375, -0.677734375, -0.37744140625, -0.0771484375, 0.22314453125, 0.5234375, 0.82373046875, 1.1240234375, 1.42431640625, 1.724609375, 2.02490234375, 2.3251953125, 2.62548828125, 2.92578125, 3.22607421875, 3.5263671875, 3.82666015625, 4.126953125, 4.42724609375, 4.7275390625, 5.02783203125, 5.328125, 5.62841796875, 5.9287109375, 6.22900390625, 6.529296875, 6.82958984375, 7.1298828125, 7.43017578125, 7.73046875, 8.03076171875, 8.3310546875, 8.63134765625, 8.931640625, 9.23193359375, 9.5322265625, 9.83251953125, 10.1328125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 6.0, 5.0, 11.0, 32.0, 72.0, 3875.0, 48.0, 14.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1484375, -4.04296875, -3.9375, -3.83203125, -3.7265625, -3.62109375, -3.515625, -3.41015625, -3.3046875, -3.19921875, -3.09375, -2.98828125, -2.8828125, -2.77734375, -2.671875, -2.56640625, -2.4609375, -2.35546875, -2.25, -2.14453125, -2.0390625, -1.93359375, -1.828125, -1.72265625, -1.6171875, -1.51171875, -1.40625, -1.30078125, -1.1953125, -1.08984375, -0.984375, -0.87890625, -0.7734375, -0.66796875, -0.5625, -0.45703125, -0.3515625, -0.24609375, -0.140625, -0.03515625, 0.0703125, 0.17578125, 0.28125, 0.38671875, 0.4921875, 0.59765625, 0.703125, 0.80859375, 0.9140625, 1.01953125, 1.125, 1.23046875, 1.3359375, 1.44140625, 1.546875, 1.65234375, 1.7578125, 1.86328125, 1.96875, 2.07421875, 2.1796875, 2.28515625, 2.390625, 2.49609375, 2.6015625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 6.0, 4.0, 40.0, 197.0, 508.0, 223.0, 29.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.544151306152344, -24.789398193359375, -24.03464698791504, -23.27989387512207, -22.5251407623291, -21.770387649536133, -21.015636444091797, -20.260883331298828, -19.50613021850586, -18.75137710571289, -17.996625900268555, -17.241872787475586, -16.487119674682617, -15.732367515563965, -14.977615356445312, -14.222862243652344, -13.468110084533691, -12.713357925415039, -11.95860481262207, -11.203852653503418, -10.44909954071045, -9.694347381591797, -8.939594268798828, -8.184842109680176, -7.430089473724365, -6.675336837768555, -5.920584201812744, -5.165831565856934, -4.411079406738281, -3.6563265323638916, -2.90157413482666, -2.1468214988708496, -1.392068862915039, -0.6373162865638733, 0.11743628978729248, 0.8721888065338135, 1.626941442489624, 2.3816940784454346, 3.136446475982666, 3.8911991119384766, 4.645951747894287, 5.400704383850098, 6.155457019805908, 6.910209655761719, 7.664961814880371, 8.41971492767334, 9.174467086791992, 9.929220199584961, 10.683972358703613, 11.438724517822266, 12.193477630615234, 12.948229789733887, 13.702982902526855, 14.457735061645508, 15.212488174438477, 15.967240333557129, 16.72199249267578, 17.47674560546875, 18.231496810913086, 18.986249923706055, 19.741003036499023, 20.495756149291992, 21.250507354736328, 22.005260467529297, 22.760013580322266]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 0.0, 3.0, 3.0, 8.0, 8.0, 11.0, 15.0, 20.0, 26.0, 31.0, 36.0, 37.0, 38.0, 53.0, 56.0, 44.0, 38.0, 55.0, 46.0, 58.0, 44.0, 53.0, 49.0, 42.0, 44.0, 35.0, 28.0, 20.0, 25.0, 19.0, 17.0, 10.0, 12.0, 6.0, 4.0, 5.0, 1.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2756781578063965, -4.127501487731934, -3.9793245792388916, -3.8311476707458496, -3.6829710006713867, -3.534794330596924, -3.386617422103882, -3.23844051361084, -3.090263843536377, -2.942087173461914, -2.793910264968872, -2.64573335647583, -2.497556686401367, -2.3493800163269043, -2.2012031078338623, -2.0530261993408203, -1.9048495292663574, -1.756672739982605, -1.6084959506988525, -1.4603191614151, -1.3121423721313477, -1.1639655828475952, -1.0157887935638428, -0.8676120042800903, -0.7194352149963379, -0.5712584257125854, -0.423081636428833, -0.27490484714508057, -0.12672805786132812, 0.021448731422424316, 0.16962552070617676, 0.3178023099899292, 0.46597957611083984, 0.6141563653945923, 0.7623331546783447, 0.9105099439620972, 1.0586867332458496, 1.206863522529602, 1.3550403118133545, 1.503217101097107, 1.6513938903808594, 1.7995706796646118, 1.9477474689483643, 2.0959243774414062, 2.244101047515869, 2.392277717590332, 2.540454626083374, 2.688631534576416, 2.836808204650879, 2.984984874725342, 3.133161783218384, 3.281338691711426, 3.4295153617858887, 3.5776920318603516, 3.7258689403533936, 3.8740458488464355, 4.022222518920898, 4.170399188995361, 4.318575859069824, 4.466753005981445, 4.614929676055908, 4.763106346130371, 4.911283493041992, 5.059460163116455, 5.207636833190918]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 2.0, 10.0, 8.0, 10.0, 17.0, 35.0, 38.0, 56.0, 85.0, 150.0, 218.0, 365.0, 681.0, 1181.0, 2265.0, 4462.0, 9493.0, 21505.0, 53792.0, 152892.0, 374985.0, 269210.0, 93541.0, 34900.0, 14732.0, 6670.0, 3303.0, 1746.0, 908.0, 536.0, 272.0, 175.0, 114.0, 61.0, 51.0, 37.0, 16.0, 16.0, 7.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.27734375, -4.167022705078125, -4.05670166015625, -3.946380615234375, -3.8360595703125, -3.725738525390625, -3.61541748046875, -3.505096435546875, -3.394775390625, -3.284454345703125, -3.17413330078125, -3.063812255859375, -2.9534912109375, -2.843170166015625, -2.73284912109375, -2.622528076171875, -2.51220703125, -2.401885986328125, -2.29156494140625, -2.181243896484375, -2.0709228515625, -1.960601806640625, -1.85028076171875, -1.739959716796875, -1.629638671875, -1.519317626953125, -1.40899658203125, -1.298675537109375, -1.1883544921875, -1.078033447265625, -0.96771240234375, -0.857391357421875, -0.7470703125, -0.636749267578125, -0.52642822265625, -0.416107177734375, -0.3057861328125, -0.195465087890625, -0.08514404296875, 0.025177001953125, 0.135498046875, 0.245819091796875, 0.35614013671875, 0.466461181640625, 0.5767822265625, 0.687103271484375, 0.79742431640625, 0.907745361328125, 1.01806640625, 1.128387451171875, 1.23870849609375, 1.349029541015625, 1.4593505859375, 1.569671630859375, 1.67999267578125, 1.790313720703125, 1.900634765625, 2.010955810546875, 2.12127685546875, 2.231597900390625, 2.3419189453125, 2.452239990234375, 2.56256103515625, 2.672882080078125, 2.783203125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 7.0, 13.0, 14.0, 12.0, 19.0, 22.0, 30.0, 42.0, 53.0, 47.0, 68.0, 75.0, 79.0, 76.0, 76.0, 68.0, 50.0, 47.0, 45.0, 38.0, 26.0, 22.0, 17.0, 13.0, 13.0, 8.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.392578125, -2.304290771484375, -2.21600341796875, -2.127716064453125, -2.0394287109375, -1.951141357421875, -1.86285400390625, -1.774566650390625, -1.686279296875, -1.597991943359375, -1.50970458984375, -1.421417236328125, -1.3331298828125, -1.244842529296875, -1.15655517578125, -1.068267822265625, -0.97998046875, -0.891693115234375, -0.80340576171875, -0.715118408203125, -0.6268310546875, -0.538543701171875, -0.45025634765625, -0.361968994140625, -0.273681640625, -0.185394287109375, -0.09710693359375, -0.008819580078125, 0.0794677734375, 0.167755126953125, 0.25604248046875, 0.344329833984375, 0.4326171875, 0.520904541015625, 0.60919189453125, 0.697479248046875, 0.7857666015625, 0.874053955078125, 0.96234130859375, 1.050628662109375, 1.138916015625, 1.227203369140625, 1.31549072265625, 1.403778076171875, 1.4920654296875, 1.580352783203125, 1.66864013671875, 1.756927490234375, 1.84521484375, 1.933502197265625, 2.02178955078125, 2.110076904296875, 2.1983642578125, 2.286651611328125, 2.37493896484375, 2.463226318359375, 2.551513671875, 2.639801025390625, 2.72808837890625, 2.816375732421875, 2.9046630859375, 2.992950439453125, 3.08123779296875, 3.169525146484375, 3.2578125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 12.0, 7.0, 13.0, 21.0, 21.0, 29.0, 51.0, 56.0, 87.0, 156.0, 324.0, 643.0, 1485.0, 4492.0, 19307.0, 141644.0, 722680.0, 132088.0, 18208.0, 4490.0, 1389.0, 609.0, 256.0, 141.0, 91.0, 69.0, 49.0, 40.0, 22.0, 21.0, 15.0, 15.0, 10.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.6796875, -6.467529296875, -6.25537109375, -6.043212890625, -5.8310546875, -5.618896484375, -5.40673828125, -5.194580078125, -4.982421875, -4.770263671875, -4.55810546875, -4.345947265625, -4.1337890625, -3.921630859375, -3.70947265625, -3.497314453125, -3.28515625, -3.072998046875, -2.86083984375, -2.648681640625, -2.4365234375, -2.224365234375, -2.01220703125, -1.800048828125, -1.587890625, -1.375732421875, -1.16357421875, -0.951416015625, -0.7392578125, -0.527099609375, -0.31494140625, -0.102783203125, 0.109375, 0.321533203125, 0.53369140625, 0.745849609375, 0.9580078125, 1.170166015625, 1.38232421875, 1.594482421875, 1.806640625, 2.018798828125, 2.23095703125, 2.443115234375, 2.6552734375, 2.867431640625, 3.07958984375, 3.291748046875, 3.50390625, 3.716064453125, 3.92822265625, 4.140380859375, 4.3525390625, 4.564697265625, 4.77685546875, 4.989013671875, 5.201171875, 5.413330078125, 5.62548828125, 5.837646484375, 6.0498046875, 6.261962890625, 6.47412109375, 6.686279296875, 6.8984375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 6.0, 8.0, 10.0, 13.0, 23.0, 17.0, 31.0, 43.0, 42.0, 92.0, 55.0, 85.0, 70.0, 76.0, 86.0, 69.0, 69.0, 60.0, 44.0, 27.0, 17.0, 25.0, 12.0, 11.0, 7.0, 7.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.984375, -15.468994140625, -14.95361328125, -14.438232421875, -13.9228515625, -13.407470703125, -12.89208984375, -12.376708984375, -11.861328125, -11.345947265625, -10.83056640625, -10.315185546875, -9.7998046875, -9.284423828125, -8.76904296875, -8.253662109375, -7.73828125, -7.222900390625, -6.70751953125, -6.192138671875, -5.6767578125, -5.161376953125, -4.64599609375, -4.130615234375, -3.615234375, -3.099853515625, -2.58447265625, -2.069091796875, -1.5537109375, -1.038330078125, -0.52294921875, -0.007568359375, 0.5078125, 1.023193359375, 1.53857421875, 2.053955078125, 2.5693359375, 3.084716796875, 3.60009765625, 4.115478515625, 4.630859375, 5.146240234375, 5.66162109375, 6.177001953125, 6.6923828125, 7.207763671875, 7.72314453125, 8.238525390625, 8.75390625, 9.269287109375, 9.78466796875, 10.300048828125, 10.8154296875, 11.330810546875, 11.84619140625, 12.361572265625, 12.876953125, 13.392333984375, 13.90771484375, 14.423095703125, 14.9384765625, 15.453857421875, 15.96923828125, 16.484619140625, 17.0]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 5.0, 3.0, 3.0, 9.0, 13.0, 46.0, 168.0, 1026.0, 239478.0, 806156.0, 1324.0, 215.0, 58.0, 23.0, 15.0, 8.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4453125, -7.8841552734375, -7.322998046875, -6.7618408203125, -6.20068359375, -5.6395263671875, -5.078369140625, -4.5172119140625, -3.9560546875, -3.3948974609375, -2.833740234375, -2.2725830078125, -1.71142578125, -1.1502685546875, -0.589111328125, -0.0279541015625, 0.533203125, 1.0943603515625, 1.655517578125, 2.2166748046875, 2.77783203125, 3.3389892578125, 3.900146484375, 4.4613037109375, 5.0224609375, 5.5836181640625, 6.144775390625, 6.7059326171875, 7.26708984375, 7.8282470703125, 8.389404296875, 8.9505615234375, 9.51171875, 10.0728759765625, 10.634033203125, 11.1951904296875, 11.75634765625, 12.3175048828125, 12.878662109375, 13.4398193359375, 14.0009765625, 14.5621337890625, 15.123291015625, 15.6844482421875, 16.24560546875, 16.8067626953125, 17.367919921875, 17.9290771484375, 18.490234375, 19.0513916015625, 19.612548828125, 20.1737060546875, 20.73486328125, 21.2960205078125, 21.857177734375, 22.4183349609375, 22.9794921875, 23.5406494140625, 24.101806640625, 24.6629638671875, 25.22412109375, 25.7852783203125, 26.346435546875, 26.9075927734375, 27.46875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 5.0, 4.0, 9.0, 7.0, 19.0, 14.0, 26.0, 35.0, 65.0, 80.0, 125.0, 124.0, 130.0, 95.0, 93.0, 46.0, 38.0, 22.0, 13.0, 18.0, 11.0, 9.0, 6.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006189346313476562, -0.000603456050157547, -0.0005879774689674377, -0.0005724988877773285, -0.0005570203065872192, -0.00054154172539711, -0.0005260631442070007, -0.0005105845630168915, -0.0004951059818267822, -0.000479627400636673, -0.0004641488194465637, -0.00044867023825645447, -0.0004331916570663452, -0.00041771307587623596, -0.0004022344946861267, -0.00038675591349601746, -0.0003712773323059082, -0.00035579875111579895, -0.0003403201699256897, -0.00032484158873558044, -0.0003093630075454712, -0.00029388442635536194, -0.0002784058451652527, -0.00026292726397514343, -0.0002474486827850342, -0.00023197010159492493, -0.00021649152040481567, -0.00020101293921470642, -0.00018553435802459717, -0.00017005577683448792, -0.00015457719564437866, -0.0001390986144542694, -0.00012362003326416016, -0.0001081414520740509, -9.266287088394165e-05, -7.71842896938324e-05, -6.170570850372314e-05, -4.622712731361389e-05, -3.074854612350464e-05, -1.5269964933395386e-05, 2.086162567138672e-07, 1.568719744682312e-05, 3.116577863693237e-05, 4.6644359827041626e-05, 6.212294101715088e-05, 7.760152220726013e-05, 9.308010339736938e-05, 0.00010855868458747864, 0.0001240372657775879, 0.00013951584696769714, 0.0001549944281578064, 0.00017047300934791565, 0.0001859515905380249, 0.00020143017172813416, 0.0002169087529182434, 0.00023238733410835266, 0.0002478659152984619, 0.00026334449648857117, 0.0002788230776786804, 0.00029430165886878967, 0.0003097802400588989, 0.0003252588212490082, 0.00034073740243911743, 0.0003562159836292267, 0.00037169456481933594]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 9.0, 9.0, 20.0, 19.0, 57.0, 91.0, 208.0, 416.0, 1247.0, 5160.0, 55908.0, 928504.0, 50002.0, 4875.0, 1234.0, 390.0, 195.0, 98.0, 47.0, 18.0, 16.0, 14.0, 8.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.07421875, -4.88958740234375, -4.7049560546875, -4.52032470703125, -4.335693359375, -4.15106201171875, -3.9664306640625, -3.78179931640625, -3.59716796875, -3.41253662109375, -3.2279052734375, -3.04327392578125, -2.858642578125, -2.67401123046875, -2.4893798828125, -2.30474853515625, -2.1201171875, -1.93548583984375, -1.7508544921875, -1.56622314453125, -1.381591796875, -1.19696044921875, -1.0123291015625, -0.82769775390625, -0.64306640625, -0.45843505859375, -0.2738037109375, -0.08917236328125, 0.095458984375, 0.28009033203125, 0.4647216796875, 0.64935302734375, 0.833984375, 1.01861572265625, 1.2032470703125, 1.38787841796875, 1.572509765625, 1.75714111328125, 1.9417724609375, 2.12640380859375, 2.31103515625, 2.49566650390625, 2.6802978515625, 2.86492919921875, 3.049560546875, 3.23419189453125, 3.4188232421875, 3.60345458984375, 3.7880859375, 3.97271728515625, 4.1573486328125, 4.34197998046875, 4.526611328125, 4.71124267578125, 4.8958740234375, 5.08050537109375, 5.26513671875, 5.44976806640625, 5.6343994140625, 5.81903076171875, 6.003662109375, 6.18829345703125, 6.3729248046875, 6.55755615234375, 6.7421875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 8.0, 3.0, 12.0, 11.0, 29.0, 47.0, 115.0, 185.0, 221.0, 176.0, 95.0, 42.0, 16.0, 11.0, 10.0, 6.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.171875, -6.899658203125, -6.62744140625, -6.355224609375, -6.0830078125, -5.810791015625, -5.53857421875, -5.266357421875, -4.994140625, -4.721923828125, -4.44970703125, -4.177490234375, -3.9052734375, -3.633056640625, -3.36083984375, -3.088623046875, -2.81640625, -2.544189453125, -2.27197265625, -1.999755859375, -1.7275390625, -1.455322265625, -1.18310546875, -0.910888671875, -0.638671875, -0.366455078125, -0.09423828125, 0.177978515625, 0.4501953125, 0.722412109375, 0.99462890625, 1.266845703125, 1.5390625, 1.811279296875, 2.08349609375, 2.355712890625, 2.6279296875, 2.900146484375, 3.17236328125, 3.444580078125, 3.716796875, 3.989013671875, 4.26123046875, 4.533447265625, 4.8056640625, 5.077880859375, 5.35009765625, 5.622314453125, 5.89453125, 6.166748046875, 6.43896484375, 6.711181640625, 6.9833984375, 7.255615234375, 7.52783203125, 7.800048828125, 8.072265625, 8.344482421875, 8.61669921875, 8.888916015625, 9.1611328125, 9.433349609375, 9.70556640625, 9.977783203125, 10.25]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 8.0, 8.0, 45.0, 170.0, 372.0, 287.0, 93.0, 20.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.10096740722656, -97.19606018066406, -93.2911605834961, -89.3862533569336, -85.48135375976562, -81.57644653320312, -77.67153930664062, -73.76663970947266, -69.86174011230469, -65.95683288574219, -62.05193328857422, -58.14702606201172, -54.24212646484375, -50.33721923828125, -46.432315826416016, -42.52741241455078, -38.62250518798828, -34.71760177612305, -30.812698364257812, -26.907793045043945, -23.00288963317871, -19.097986221313477, -15.19308090209961, -11.288177490234375, -7.383274078369141, -3.478370189666748, 0.42653369903564453, 4.331438064575195, 8.23634147644043, 12.141244888305664, 16.04615020751953, 19.951053619384766, 23.85595703125, 27.760860443115234, 31.66576385498047, 35.57067108154297, 39.47557067871094, 43.38047790527344, 47.28538131713867, 51.190284729003906, 55.09518814086914, 59.000091552734375, 62.90499496459961, 66.80989837646484, 70.71480560302734, 74.61970520019531, 78.52461242675781, 82.42951965332031, 86.33441925048828, 90.23932647705078, 94.14422607421875, 98.04913330078125, 101.95403289794922, 105.85894012451172, 109.76383972167969, 113.66874694824219, 117.57365417480469, 121.47856140136719, 125.38346099853516, 129.28836059570312, 133.19326782226562, 137.09817504882812, 141.00308227539062, 144.90798950195312, 148.81288146972656]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 4.0, 0.0, 4.0, 7.0, 4.0, 4.0, 10.0, 14.0, 6.0, 25.0, 23.0, 19.0, 34.0, 40.0, 42.0, 34.0, 56.0, 42.0, 58.0, 62.0, 54.0, 62.0, 40.0, 52.0, 55.0, 43.0, 34.0, 36.0, 27.0, 18.0, 16.0, 15.0, 16.0, 20.0, 8.0, 6.0, 5.0, 6.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0], "bins": [-64.59442138671875, -62.9588623046875, -61.32330322265625, -59.687744140625, -58.05218505859375, -56.4166259765625, -54.781063079833984, -53.145503997802734, -51.509944915771484, -49.874385833740234, -48.238826751708984, -46.603267669677734, -44.96770477294922, -43.33214569091797, -41.69658660888672, -40.06102752685547, -38.42546844482422, -36.78990936279297, -35.15435028076172, -33.51879119873047, -31.883230209350586, -30.247671127319336, -28.612110137939453, -26.976551055908203, -25.340991973876953, -23.705432891845703, -22.069873809814453, -20.43431282043457, -18.79875373840332, -17.16319465637207, -15.527634620666504, -13.892074584960938, -12.256511688232422, -10.620952606201172, -8.985392570495605, -7.349833011627197, -5.714273452758789, -4.078714370727539, -2.4431543350219727, -0.8075942993164062, 0.8279647827148438, 2.463524341583252, 4.09908390045166, 5.734643459320068, 7.370203018188477, 9.005762100219727, 10.641322135925293, 12.27688217163086, 13.91244125366211, 15.54800033569336, 17.18355941772461, 18.819120407104492, 20.454679489135742, 22.090238571166992, 23.725799560546875, 25.361358642578125, 26.996917724609375, 28.632476806640625, 30.268035888671875, 31.903596878051758, 33.539154052734375, 35.174713134765625, 36.81027603149414, 38.44583511352539, 40.08139419555664]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 1.0, 7.0, 5.0, 20.0, 21.0, 33.0, 34.0, 54.0, 102.0, 199.0, 400.0, 885.0, 2534.0, 11905.0, 4085020.0, 83534.0, 6527.0, 1711.0, 658.0, 275.0, 143.0, 74.0, 56.0, 30.0, 17.0, 11.0, 7.0, 3.0, 4.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.5078125, -12.1856689453125, -11.863525390625, -11.5413818359375, -11.21923828125, -10.8970947265625, -10.574951171875, -10.2528076171875, -9.9306640625, -9.6085205078125, -9.286376953125, -8.9642333984375, -8.64208984375, -8.3199462890625, -7.997802734375, -7.6756591796875, -7.353515625, -7.0313720703125, -6.709228515625, -6.3870849609375, -6.06494140625, -5.7427978515625, -5.420654296875, -5.0985107421875, -4.7763671875, -4.4542236328125, -4.132080078125, -3.8099365234375, -3.48779296875, -3.1656494140625, -2.843505859375, -2.5213623046875, -2.19921875, -1.8770751953125, -1.554931640625, -1.2327880859375, -0.91064453125, -0.5885009765625, -0.266357421875, 0.0557861328125, 0.3779296875, 0.7000732421875, 1.022216796875, 1.3443603515625, 1.66650390625, 1.9886474609375, 2.310791015625, 2.6329345703125, 2.955078125, 3.2772216796875, 3.599365234375, 3.9215087890625, 4.24365234375, 4.5657958984375, 4.887939453125, 5.2100830078125, 5.5322265625, 5.8543701171875, 6.176513671875, 6.4986572265625, 6.82080078125, 7.1429443359375, 7.465087890625, 7.7872314453125, 8.109375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 6.0, 10.0, 7.0, 17.0, 12.0, 21.0, 28.0, 40.0, 45.0, 64.0, 69.0, 101.0, 83.0, 96.0, 61.0, 75.0, 63.0, 53.0, 37.0, 33.0, 20.0, 17.0, 11.0, 7.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.21875, -3.128387451171875, -3.03802490234375, -2.947662353515625, -2.8572998046875, -2.766937255859375, -2.67657470703125, -2.586212158203125, -2.495849609375, -2.405487060546875, -2.31512451171875, -2.224761962890625, -2.1343994140625, -2.044036865234375, -1.95367431640625, -1.863311767578125, -1.77294921875, -1.682586669921875, -1.59222412109375, -1.501861572265625, -1.4114990234375, -1.321136474609375, -1.23077392578125, -1.140411376953125, -1.050048828125, -0.959686279296875, -0.86932373046875, -0.778961181640625, -0.6885986328125, -0.598236083984375, -0.50787353515625, -0.417510986328125, -0.3271484375, -0.236785888671875, -0.14642333984375, -0.056060791015625, 0.0343017578125, 0.124664306640625, 0.21502685546875, 0.305389404296875, 0.395751953125, 0.486114501953125, 0.57647705078125, 0.666839599609375, 0.7572021484375, 0.847564697265625, 0.93792724609375, 1.028289794921875, 1.11865234375, 1.209014892578125, 1.29937744140625, 1.389739990234375, 1.4801025390625, 1.570465087890625, 1.66082763671875, 1.751190185546875, 1.841552734375, 1.931915283203125, 2.02227783203125, 2.112640380859375, 2.2030029296875, 2.293365478515625, 2.38372802734375, 2.474090576171875, 2.564453125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 6.0, 4.0, 5.0, 8.0, 10.0, 12.0, 18.0, 33.0, 53.0, 48.0, 77.0, 121.0, 120.0, 152.0, 225.0, 330.0, 806.0, 6049.0, 4140605.0, 42189.0, 1864.0, 505.0, 267.0, 164.0, 140.0, 99.0, 103.0, 73.0, 53.0, 43.0, 24.0, 21.0, 22.0, 9.0, 10.0, 5.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.828125, -18.124267578125, -17.42041015625, -16.716552734375, -16.0126953125, -15.308837890625, -14.60498046875, -13.901123046875, -13.197265625, -12.493408203125, -11.78955078125, -11.085693359375, -10.3818359375, -9.677978515625, -8.97412109375, -8.270263671875, -7.56640625, -6.862548828125, -6.15869140625, -5.454833984375, -4.7509765625, -4.047119140625, -3.34326171875, -2.639404296875, -1.935546875, -1.231689453125, -0.52783203125, 0.176025390625, 0.8798828125, 1.583740234375, 2.28759765625, 2.991455078125, 3.6953125, 4.399169921875, 5.10302734375, 5.806884765625, 6.5107421875, 7.214599609375, 7.91845703125, 8.622314453125, 9.326171875, 10.030029296875, 10.73388671875, 11.437744140625, 12.1416015625, 12.845458984375, 13.54931640625, 14.253173828125, 14.95703125, 15.660888671875, 16.36474609375, 17.068603515625, 17.7724609375, 18.476318359375, 19.18017578125, 19.884033203125, 20.587890625, 21.291748046875, 21.99560546875, 22.699462890625, 23.4033203125, 24.107177734375, 24.81103515625, 25.514892578125, 26.21875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 13.0, 17.0, 51.0, 684.0, 3245.0, 50.0, 9.0, 7.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.83984375, -4.55584716796875, -4.2718505859375, -3.98785400390625, -3.703857421875, -3.41986083984375, -3.1358642578125, -2.85186767578125, -2.56787109375, -2.28387451171875, -1.9998779296875, -1.71588134765625, -1.431884765625, -1.14788818359375, -0.8638916015625, -0.57989501953125, -0.2958984375, -0.01190185546875, 0.2720947265625, 0.55609130859375, 0.840087890625, 1.12408447265625, 1.4080810546875, 1.69207763671875, 1.97607421875, 2.26007080078125, 2.5440673828125, 2.82806396484375, 3.112060546875, 3.39605712890625, 3.6800537109375, 3.96405029296875, 4.248046875, 4.53204345703125, 4.8160400390625, 5.10003662109375, 5.384033203125, 5.66802978515625, 5.9520263671875, 6.23602294921875, 6.52001953125, 6.80401611328125, 7.0880126953125, 7.37200927734375, 7.656005859375, 7.94000244140625, 8.2239990234375, 8.50799560546875, 8.7919921875, 9.07598876953125, 9.3599853515625, 9.64398193359375, 9.927978515625, 10.21197509765625, 10.4959716796875, 10.77996826171875, 11.06396484375, 11.34796142578125, 11.6319580078125, 11.91595458984375, 12.199951171875, 12.48394775390625, 12.7679443359375, 13.05194091796875, 13.3359375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 6.0, 3.0, 2.0, 14.0, 24.0, 81.0, 291.0, 386.0, 141.0, 39.0, 14.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.62700843811035, -29.208858489990234, -27.79071044921875, -26.372560501098633, -24.954410552978516, -23.5362606048584, -22.11811065673828, -20.699962615966797, -19.28181266784668, -17.863662719726562, -16.445514678955078, -15.027364730834961, -13.609214782714844, -12.191064834594727, -10.772915840148926, -9.354766845703125, -7.936616897583008, -6.518467426300049, -5.10031795501709, -3.682168483734131, -2.264019012451172, -0.8458695411682129, 0.5722799301147461, 1.9904289245605469, 3.408578872680664, 4.826728343963623, 6.244877815246582, 7.663027286529541, 9.0811767578125, 10.499326705932617, 11.917475700378418, 13.335624694824219, 14.753776550292969, 16.171926498413086, 17.590076446533203, 19.008224487304688, 20.426374435424805, 21.844524383544922, 23.262672424316406, 24.680822372436523, 26.09897232055664, 27.517122268676758, 28.935272216796875, 30.35342025756836, 31.771570205688477, 33.189720153808594, 34.60786819458008, 36.02601623535156, 37.44416809082031, 38.8623161315918, 40.28046798706055, 41.69861602783203, 43.11676788330078, 44.534915924072266, 45.95306396484375, 47.3712158203125, 48.789363861083984, 50.20751190185547, 51.62566375732422, 53.0438117980957, 54.46195983886719, 55.88011169433594, 57.29825973510742, 58.716407775878906, 60.134559631347656]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 7.0, 9.0, 6.0, 11.0, 17.0, 19.0, 34.0, 42.0, 55.0, 62.0, 63.0, 75.0, 89.0, 82.0, 85.0, 61.0, 71.0, 44.0, 44.0, 26.0, 25.0, 17.0, 20.0, 13.0, 10.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.907756805419922, -23.20425796508789, -22.50075912475586, -21.797260284423828, -21.093761444091797, -20.390260696411133, -19.6867618560791, -18.98326301574707, -18.27976417541504, -17.576265335083008, -16.872766494750977, -16.169267654418945, -15.465767860412598, -14.762269020080566, -14.058769226074219, -13.355270385742188, -12.651771545410156, -11.948272705078125, -11.244773864746094, -10.541274070739746, -9.837775230407715, -9.134276390075684, -8.430776596069336, -7.727277755737305, -7.023778915405273, -6.320280075073242, -5.616780757904053, -4.913281440734863, -4.209782600402832, -3.5062835216522217, -2.8027844429016113, -2.099285125732422, -1.3957862854003906, -0.6922872066497803, 0.011211872100830078, 0.7147109508514404, 1.4182100296020508, 2.121709108352661, 2.8252081871032715, 3.528707504272461, 4.232206344604492, 4.935705184936523, 5.639204502105713, 6.342703819274902, 7.046202659606934, 7.749701499938965, 8.453201293945312, 9.156700134277344, 9.860198974609375, 10.563697814941406, 11.267196655273438, 11.970696449279785, 12.674195289611816, 13.377694129943848, 14.081193923950195, 14.784692764282227, 15.488191604614258, 16.19169044494629, 16.89518928527832, 17.59868812561035, 18.302188873291016, 19.005687713623047, 19.709186553955078, 20.41268539428711, 21.11618423461914]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 5.0, 12.0, 14.0, 22.0, 15.0, 24.0, 45.0, 61.0, 67.0, 134.0, 239.0, 438.0, 875.0, 2165.0, 6326.0, 25971.0, 166696.0, 659053.0, 152332.0, 24039.0, 5982.0, 2031.0, 907.0, 452.0, 260.0, 125.0, 98.0, 50.0, 37.0, 20.0, 14.0, 12.0, 10.0, 6.0, 6.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.59765625, -6.3880615234375, -6.178466796875, -5.9688720703125, -5.75927734375, -5.5496826171875, -5.340087890625, -5.1304931640625, -4.9208984375, -4.7113037109375, -4.501708984375, -4.2921142578125, -4.08251953125, -3.8729248046875, -3.663330078125, -3.4537353515625, -3.244140625, -3.0345458984375, -2.824951171875, -2.6153564453125, -2.40576171875, -2.1961669921875, -1.986572265625, -1.7769775390625, -1.5673828125, -1.3577880859375, -1.148193359375, -0.9385986328125, -0.72900390625, -0.5194091796875, -0.309814453125, -0.1002197265625, 0.109375, 0.3189697265625, 0.528564453125, 0.7381591796875, 0.94775390625, 1.1573486328125, 1.366943359375, 1.5765380859375, 1.7861328125, 1.9957275390625, 2.205322265625, 2.4149169921875, 2.62451171875, 2.8341064453125, 3.043701171875, 3.2532958984375, 3.462890625, 3.6724853515625, 3.882080078125, 4.0916748046875, 4.30126953125, 4.5108642578125, 4.720458984375, 4.9300537109375, 5.1396484375, 5.3492431640625, 5.558837890625, 5.7684326171875, 5.97802734375, 6.1876220703125, 6.397216796875, 6.6068115234375, 6.81640625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 10.0, 9.0, 12.0, 22.0, 20.0, 25.0, 30.0, 46.0, 68.0, 63.0, 75.0, 77.0, 73.0, 84.0, 63.0, 66.0, 54.0, 45.0, 38.0, 27.0, 16.0, 19.0, 16.0, 6.0, 8.0, 7.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.884765625, -2.783050537109375, -2.68133544921875, -2.579620361328125, -2.4779052734375, -2.376190185546875, -2.27447509765625, -2.172760009765625, -2.071044921875, -1.969329833984375, -1.86761474609375, -1.765899658203125, -1.6641845703125, -1.562469482421875, -1.46075439453125, -1.359039306640625, -1.25732421875, -1.155609130859375, -1.05389404296875, -0.952178955078125, -0.8504638671875, -0.748748779296875, -0.64703369140625, -0.545318603515625, -0.443603515625, -0.341888427734375, -0.24017333984375, -0.138458251953125, -0.0367431640625, 0.064971923828125, 0.16668701171875, 0.268402099609375, 0.3701171875, 0.471832275390625, 0.57354736328125, 0.675262451171875, 0.7769775390625, 0.878692626953125, 0.98040771484375, 1.082122802734375, 1.183837890625, 1.285552978515625, 1.38726806640625, 1.488983154296875, 1.5906982421875, 1.692413330078125, 1.79412841796875, 1.895843505859375, 1.99755859375, 2.099273681640625, 2.20098876953125, 2.302703857421875, 2.4044189453125, 2.506134033203125, 2.60784912109375, 2.709564208984375, 2.811279296875, 2.912994384765625, 3.01470947265625, 3.116424560546875, 3.2181396484375, 3.319854736328125, 3.42156982421875, 3.523284912109375, 3.625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 5.0, 5.0, 21.0, 31.0, 66.0, 182.0, 526.0, 3685.0, 940051.0, 101772.0, 1669.0, 330.0, 127.0, 41.0, 27.0, 15.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.1875, -33.2060546875, -32.224609375, -31.2431640625, -30.26171875, -29.2802734375, -28.298828125, -27.3173828125, -26.3359375, -25.3544921875, -24.373046875, -23.3916015625, -22.41015625, -21.4287109375, -20.447265625, -19.4658203125, -18.484375, -17.5029296875, -16.521484375, -15.5400390625, -14.55859375, -13.5771484375, -12.595703125, -11.6142578125, -10.6328125, -9.6513671875, -8.669921875, -7.6884765625, -6.70703125, -5.7255859375, -4.744140625, -3.7626953125, -2.78125, -1.7998046875, -0.818359375, 0.1630859375, 1.14453125, 2.1259765625, 3.107421875, 4.0888671875, 5.0703125, 6.0517578125, 7.033203125, 8.0146484375, 8.99609375, 9.9775390625, 10.958984375, 11.9404296875, 12.921875, 13.9033203125, 14.884765625, 15.8662109375, 16.84765625, 17.8291015625, 18.810546875, 19.7919921875, 20.7734375, 21.7548828125, 22.736328125, 23.7177734375, 24.69921875, 25.6806640625, 26.662109375, 27.6435546875, 28.625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 5.0, 4.0, 2.0, 11.0, 16.0, 29.0, 29.0, 51.0, 70.0, 86.0, 97.0, 131.0, 113.0, 84.0, 76.0, 67.0, 54.0, 34.0, 23.0, 9.0, 9.0, 5.0, 6.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-26.75, -26.005615234375, -25.26123046875, -24.516845703125, -23.7724609375, -23.028076171875, -22.28369140625, -21.539306640625, -20.794921875, -20.050537109375, -19.30615234375, -18.561767578125, -17.8173828125, -17.072998046875, -16.32861328125, -15.584228515625, -14.83984375, -14.095458984375, -13.35107421875, -12.606689453125, -11.8623046875, -11.117919921875, -10.37353515625, -9.629150390625, -8.884765625, -8.140380859375, -7.39599609375, -6.651611328125, -5.9072265625, -5.162841796875, -4.41845703125, -3.674072265625, -2.9296875, -2.185302734375, -1.44091796875, -0.696533203125, 0.0478515625, 0.792236328125, 1.53662109375, 2.281005859375, 3.025390625, 3.769775390625, 4.51416015625, 5.258544921875, 6.0029296875, 6.747314453125, 7.49169921875, 8.236083984375, 8.98046875, 9.724853515625, 10.46923828125, 11.213623046875, 11.9580078125, 12.702392578125, 13.44677734375, 14.191162109375, 14.935546875, 15.679931640625, 16.42431640625, 17.168701171875, 17.9130859375, 18.657470703125, 19.40185546875, 20.146240234375, 20.890625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 2.0, 3.0, 2.0, 7.0, 4.0, 13.0, 19.0, 32.0, 74.0, 211.0, 927.0, 12957.0, 1013466.0, 19407.0, 1010.0, 264.0, 81.0, 37.0, 15.0, 9.0, 5.0, 4.0, 1.0, 4.0, 3.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.015625, -8.6883544921875, -8.361083984375, -8.0338134765625, -7.70654296875, -7.3792724609375, -7.052001953125, -6.7247314453125, -6.3974609375, -6.0701904296875, -5.742919921875, -5.4156494140625, -5.08837890625, -4.7611083984375, -4.433837890625, -4.1065673828125, -3.779296875, -3.4520263671875, -3.124755859375, -2.7974853515625, -2.47021484375, -2.1429443359375, -1.815673828125, -1.4884033203125, -1.1611328125, -0.8338623046875, -0.506591796875, -0.1793212890625, 0.14794921875, 0.4752197265625, 0.802490234375, 1.1297607421875, 1.45703125, 1.7843017578125, 2.111572265625, 2.4388427734375, 2.76611328125, 3.0933837890625, 3.420654296875, 3.7479248046875, 4.0751953125, 4.4024658203125, 4.729736328125, 5.0570068359375, 5.38427734375, 5.7115478515625, 6.038818359375, 6.3660888671875, 6.693359375, 7.0206298828125, 7.347900390625, 7.6751708984375, 8.00244140625, 8.3297119140625, 8.656982421875, 8.9842529296875, 9.3115234375, 9.6387939453125, 9.966064453125, 10.2933349609375, 10.62060546875, 10.9478759765625, 11.275146484375, 11.6024169921875, 11.9296875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 7.0, 12.0, 13.0, 11.0, 14.0, 25.0, 20.0, 37.0, 56.0, 76.0, 121.0, 127.0, 131.0, 102.0, 73.0, 40.0, 33.0, 18.0, 17.0, 17.0, 12.0, 9.0, 3.0, 4.0, 6.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0004487037658691406, -0.00043498724699020386, -0.0004212707281112671, -0.0004075542092323303, -0.00039383769035339355, -0.0003801211714744568, -0.00036640465259552, -0.00035268813371658325, -0.0003389716148376465, -0.0003252550959587097, -0.00031153857707977295, -0.0002978220582008362, -0.0002841055393218994, -0.00027038902044296265, -0.0002566725015640259, -0.0002429559826850891, -0.00022923946380615234, -0.00021552294492721558, -0.0002018064260482788, -0.00018808990716934204, -0.00017437338829040527, -0.0001606568694114685, -0.00014694035053253174, -0.00013322383165359497, -0.0001195073127746582, -0.00010579079389572144, -9.207427501678467e-05, -7.83577561378479e-05, -6.464123725891113e-05, -5.0924718379974365e-05, -3.72081995010376e-05, -2.349168062210083e-05, -9.775161743164062e-06, 3.941357135772705e-06, 1.7657876014709473e-05, 3.137439489364624e-05, 4.509091377258301e-05, 5.8807432651519775e-05, 7.252395153045654e-05, 8.624047040939331e-05, 9.995698928833008e-05, 0.00011367350816726685, 0.0001273900270462036, 0.00014110654592514038, 0.00015482306480407715, 0.00016853958368301392, 0.00018225610256195068, 0.00019597262144088745, 0.00020968914031982422, 0.00022340565919876099, 0.00023712217807769775, 0.0002508386969566345, 0.0002645552158355713, 0.00027827173471450806, 0.0002919882535934448, 0.0003057047724723816, 0.00031942129135131836, 0.0003331378102302551, 0.0003468543291091919, 0.00036057084798812866, 0.00037428736686706543, 0.0003880038857460022, 0.00040172040462493896, 0.00041543692350387573, 0.0004291534423828125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 23.0, 57.0, 215.0, 1952.0, 1039522.0, 6326.0, 288.0, 101.0, 35.0, 18.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.125, -27.4326171875, -26.740234375, -26.0478515625, -25.35546875, -24.6630859375, -23.970703125, -23.2783203125, -22.5859375, -21.8935546875, -21.201171875, -20.5087890625, -19.81640625, -19.1240234375, -18.431640625, -17.7392578125, -17.046875, -16.3544921875, -15.662109375, -14.9697265625, -14.27734375, -13.5849609375, -12.892578125, -12.2001953125, -11.5078125, -10.8154296875, -10.123046875, -9.4306640625, -8.73828125, -8.0458984375, -7.353515625, -6.6611328125, -5.96875, -5.2763671875, -4.583984375, -3.8916015625, -3.19921875, -2.5068359375, -1.814453125, -1.1220703125, -0.4296875, 0.2626953125, 0.955078125, 1.6474609375, 2.33984375, 3.0322265625, 3.724609375, 4.4169921875, 5.109375, 5.8017578125, 6.494140625, 7.1865234375, 7.87890625, 8.5712890625, 9.263671875, 9.9560546875, 10.6484375, 11.3408203125, 12.033203125, 12.7255859375, 13.41796875, 14.1103515625, 14.802734375, 15.4951171875, 16.1875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 13.0, 15.0, 23.0, 64.0, 115.0, 194.0, 210.0, 168.0, 76.0, 43.0, 28.0, 20.0, 8.0, 7.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.5078125, -6.31207275390625, -6.1163330078125, -5.92059326171875, -5.724853515625, -5.52911376953125, -5.3333740234375, -5.13763427734375, -4.94189453125, -4.74615478515625, -4.5504150390625, -4.35467529296875, -4.158935546875, -3.96319580078125, -3.7674560546875, -3.57171630859375, -3.3759765625, -3.18023681640625, -2.9844970703125, -2.78875732421875, -2.593017578125, -2.39727783203125, -2.2015380859375, -2.00579833984375, -1.81005859375, -1.61431884765625, -1.4185791015625, -1.22283935546875, -1.027099609375, -0.83135986328125, -0.6356201171875, -0.43988037109375, -0.244140625, -0.04840087890625, 0.1473388671875, 0.34307861328125, 0.538818359375, 0.73455810546875, 0.9302978515625, 1.12603759765625, 1.32177734375, 1.51751708984375, 1.7132568359375, 1.90899658203125, 2.104736328125, 2.30047607421875, 2.4962158203125, 2.69195556640625, 2.8876953125, 3.08343505859375, 3.2791748046875, 3.47491455078125, 3.670654296875, 3.86639404296875, 4.0621337890625, 4.25787353515625, 4.45361328125, 4.64935302734375, 4.8450927734375, 5.04083251953125, 5.236572265625, 5.43231201171875, 5.6280517578125, 5.82379150390625, 6.01953125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 14.0, 48.0, 200.0, 414.0, 228.0, 66.0, 27.0, 8.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-213.08163452148438, -207.52978515625, -201.97793579101562, -196.42608642578125, -190.87425231933594, -185.32240295410156, -179.7705535888672, -174.2187042236328, -168.66685485839844, -163.11500549316406, -157.5631561279297, -152.01132202148438, -146.45947265625, -140.90762329101562, -135.35577392578125, -129.80392456054688, -124.25208282470703, -118.70023345947266, -113.14839172363281, -107.59654235839844, -102.04469299316406, -96.49284362792969, -90.94100189208984, -85.38915252685547, -79.83731079101562, -74.28546142578125, -68.7336196899414, -63.18177032470703, -57.629920959472656, -52.07807540893555, -46.52622985839844, -40.97438049316406, -35.42253112792969, -29.870683670043945, -24.318836212158203, -18.766990661621094, -13.215143203735352, -7.663295745849609, -2.1114501953125, 3.440399169921875, 8.992244720458984, 14.544092178344727, 20.09593963623047, 25.647785186767578, 31.19963264465332, 36.75148010253906, 42.30332565307617, 47.85517501831055, 53.407020568847656, 58.958866119384766, 64.51071166992188, 70.06256103515625, 75.61441040039062, 81.166259765625, 86.71810150146484, 92.26995086669922, 97.82179260253906, 103.37364196777344, 108.92548370361328, 114.47733306884766, 120.02918243408203, 125.58102416992188, 131.13287353515625, 136.68472290039062, 142.236572265625]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 13.0, 9.0, 13.0, 19.0, 29.0, 28.0, 28.0, 33.0, 48.0, 54.0, 66.0, 69.0, 74.0, 75.0, 55.0, 54.0, 51.0, 45.0, 45.0, 42.0, 30.0, 27.0, 18.0, 20.0, 11.0, 10.0, 4.0, 7.0, 4.0, 5.0, 3.0, 0.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.224853515625, -65.13370513916016, -63.04255294799805, -60.9514045715332, -58.86025619506836, -56.76910400390625, -54.677955627441406, -52.58680725097656, -50.49565887451172, -48.404510498046875, -46.313358306884766, -44.22220993041992, -42.13106155395508, -40.03990936279297, -37.948760986328125, -35.85761260986328, -33.76646041870117, -31.675310134887695, -29.58416175842285, -27.493011474609375, -25.40186309814453, -23.310712814331055, -21.219562530517578, -19.128414154052734, -17.037263870239258, -14.946114540100098, -12.854965209960938, -10.763814926147461, -8.6726655960083, -6.581516265869141, -4.490365982055664, -2.399216651916504, -0.30806732177734375, 1.7830822467803955, 3.8742318153381348, 5.965381622314453, 8.056530952453613, 10.147680282592773, 12.23883056640625, 14.32997989654541, 16.42112922668457, 18.512279510498047, 20.60342788696289, 22.694578170776367, 24.785728454589844, 26.876876831054688, 28.968027114868164, 31.05917739868164, 33.150325775146484, 35.24147415161133, 37.33262634277344, 39.42377471923828, 41.514923095703125, 43.60607147216797, 45.69722366333008, 47.78837203979492, 49.87952423095703, 51.970672607421875, 54.061824798583984, 56.15297317504883, 58.24412155151367, 60.33527374267578, 62.426422119140625, 64.51757049560547, 66.60871887207031]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 5.0, 1.0, 2.0, 0.0, 7.0, 8.0, 6.0, 14.0, 15.0, 18.0, 25.0, 49.0, 69.0, 100.0, 183.0, 341.0, 795.0, 1781.0, 5434.0, 20725.0, 252441.0, 3808011.0, 85087.0, 13072.0, 3635.0, 1335.0, 557.0, 277.0, 147.0, 56.0, 42.0, 20.0, 13.0, 4.0, 11.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.44921875, -7.23223876953125, -7.0152587890625, -6.79827880859375, -6.581298828125, -6.36431884765625, -6.1473388671875, -5.93035888671875, -5.71337890625, -5.49639892578125, -5.2794189453125, -5.06243896484375, -4.845458984375, -4.62847900390625, -4.4114990234375, -4.19451904296875, -3.9775390625, -3.76055908203125, -3.5435791015625, -3.32659912109375, -3.109619140625, -2.89263916015625, -2.6756591796875, -2.45867919921875, -2.24169921875, -2.02471923828125, -1.8077392578125, -1.59075927734375, -1.373779296875, -1.15679931640625, -0.9398193359375, -0.72283935546875, -0.505859375, -0.28887939453125, -0.0718994140625, 0.14508056640625, 0.362060546875, 0.57904052734375, 0.7960205078125, 1.01300048828125, 1.22998046875, 1.44696044921875, 1.6639404296875, 1.88092041015625, 2.097900390625, 2.31488037109375, 2.5318603515625, 2.74884033203125, 2.9658203125, 3.18280029296875, 3.3997802734375, 3.61676025390625, 3.833740234375, 4.05072021484375, 4.2677001953125, 4.48468017578125, 4.70166015625, 4.91864013671875, 5.1356201171875, 5.35260009765625, 5.569580078125, 5.78656005859375, 6.0035400390625, 6.22052001953125, 6.4375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 4.0, 12.0, 13.0, 11.0, 17.0, 28.0, 41.0, 41.0, 71.0, 65.0, 92.0, 81.0, 84.0, 75.0, 72.0, 69.0, 60.0, 49.0, 29.0, 26.0, 18.0, 15.0, 7.0, 4.0, 5.0, 2.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.02734375, -3.91912841796875, -3.8109130859375, -3.70269775390625, -3.594482421875, -3.48626708984375, -3.3780517578125, -3.26983642578125, -3.16162109375, -3.05340576171875, -2.9451904296875, -2.83697509765625, -2.728759765625, -2.62054443359375, -2.5123291015625, -2.40411376953125, -2.2958984375, -2.18768310546875, -2.0794677734375, -1.97125244140625, -1.863037109375, -1.75482177734375, -1.6466064453125, -1.53839111328125, -1.43017578125, -1.32196044921875, -1.2137451171875, -1.10552978515625, -0.997314453125, -0.88909912109375, -0.7808837890625, -0.67266845703125, -0.564453125, -0.45623779296875, -0.3480224609375, -0.23980712890625, -0.131591796875, -0.02337646484375, 0.0848388671875, 0.19305419921875, 0.30126953125, 0.40948486328125, 0.5177001953125, 0.62591552734375, 0.734130859375, 0.84234619140625, 0.9505615234375, 1.05877685546875, 1.1669921875, 1.27520751953125, 1.3834228515625, 1.49163818359375, 1.599853515625, 1.70806884765625, 1.8162841796875, 1.92449951171875, 2.03271484375, 2.14093017578125, 2.2491455078125, 2.35736083984375, 2.465576171875, 2.57379150390625, 2.6820068359375, 2.79022216796875, 2.8984375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 9.0, 22.0, 47.0, 79.0, 200.0, 633.0, 3613.0, 318603.0, 3863240.0, 6612.0, 824.0, 230.0, 95.0, 36.0, 16.0, 14.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.25, -21.59765625, -20.9453125, -20.29296875, -19.640625, -18.98828125, -18.3359375, -17.68359375, -17.03125, -16.37890625, -15.7265625, -15.07421875, -14.421875, -13.76953125, -13.1171875, -12.46484375, -11.8125, -11.16015625, -10.5078125, -9.85546875, -9.203125, -8.55078125, -7.8984375, -7.24609375, -6.59375, -5.94140625, -5.2890625, -4.63671875, -3.984375, -3.33203125, -2.6796875, -2.02734375, -1.375, -0.72265625, -0.0703125, 0.58203125, 1.234375, 1.88671875, 2.5390625, 3.19140625, 3.84375, 4.49609375, 5.1484375, 5.80078125, 6.453125, 7.10546875, 7.7578125, 8.41015625, 9.0625, 9.71484375, 10.3671875, 11.01953125, 11.671875, 12.32421875, 12.9765625, 13.62890625, 14.28125, 14.93359375, 15.5859375, 16.23828125, 16.890625, 17.54296875, 18.1953125, 18.84765625, 19.5]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 8.0, 7.0, 12.0, 26.0, 48.0, 76.0, 240.0, 1619.0, 1661.0, 231.0, 61.0, 40.0, 15.0, 12.0, 10.0, 5.0, 5.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.71875, -20.2587890625, -19.798828125, -19.3388671875, -18.87890625, -18.4189453125, -17.958984375, -17.4990234375, -17.0390625, -16.5791015625, -16.119140625, -15.6591796875, -15.19921875, -14.7392578125, -14.279296875, -13.8193359375, -13.359375, -12.8994140625, -12.439453125, -11.9794921875, -11.51953125, -11.0595703125, -10.599609375, -10.1396484375, -9.6796875, -9.2197265625, -8.759765625, -8.2998046875, -7.83984375, -7.3798828125, -6.919921875, -6.4599609375, -6.0, -5.5400390625, -5.080078125, -4.6201171875, -4.16015625, -3.7001953125, -3.240234375, -2.7802734375, -2.3203125, -1.8603515625, -1.400390625, -0.9404296875, -0.48046875, -0.0205078125, 0.439453125, 0.8994140625, 1.359375, 1.8193359375, 2.279296875, 2.7392578125, 3.19921875, 3.6591796875, 4.119140625, 4.5791015625, 5.0390625, 5.4990234375, 5.958984375, 6.4189453125, 6.87890625, 7.3388671875, 7.798828125, 8.2587890625, 8.71875]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 4.0, 4.0, 9.0, 17.0, 46.0, 88.0, 220.0, 279.0, 212.0, 65.0, 25.0, 5.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.6813735961914, -82.35697174072266, -80.0325698852539, -77.70816802978516, -75.38377380371094, -73.05937194824219, -70.73497009277344, -68.41056823730469, -66.08616638183594, -63.76176452636719, -61.43736267089844, -59.11296463012695, -56.7885627746582, -54.46416091918945, -52.13976287841797, -49.81536102294922, -47.49095916748047, -45.16655731201172, -42.84215545654297, -40.517757415771484, -38.193355560302734, -35.868953704833984, -33.5445556640625, -31.22015380859375, -28.895751953125, -26.57135009765625, -24.246950149536133, -21.922550201416016, -19.598148345947266, -17.273746490478516, -14.949346542358398, -12.624946594238281, -10.300537109375, -7.976136207580566, -5.651735305786133, -3.327334403991699, -1.0029335021972656, 1.321467399597168, 3.6458683013916016, 5.970268249511719, 8.294670104980469, 10.619071006774902, 12.943471908569336, 15.26787281036377, 17.592273712158203, 19.916675567626953, 22.24107551574707, 24.565475463867188, 26.889877319335938, 29.214279174804688, 31.538679122924805, 33.86307907104492, 36.18748092651367, 38.51188278198242, 40.836280822753906, 43.160682678222656, 45.485084533691406, 47.809486389160156, 50.133888244628906, 52.45828628540039, 54.78268814086914, 57.10708999633789, 59.431488037109375, 61.755889892578125, 64.08029174804688]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 8.0, 13.0, 14.0, 12.0, 24.0, 28.0, 50.0, 61.0, 73.0, 96.0, 98.0, 107.0, 96.0, 78.0, 86.0, 41.0, 35.0, 27.0, 17.0, 12.0, 16.0, 2.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.93637084960938, -74.90536499023438, -72.87435913085938, -70.84335327148438, -68.81234741210938, -66.78134155273438, -64.75033569335938, -62.71933364868164, -60.688331604003906, -58.657325744628906, -56.626319885253906, -54.595314025878906, -52.56431198120117, -50.53330612182617, -48.50230026245117, -46.47129440307617, -44.44028854370117, -42.40928268432617, -40.37827682495117, -38.34727478027344, -36.31626892089844, -34.28526306152344, -32.25425720214844, -30.223251342773438, -28.19224739074707, -26.16124153137207, -24.130237579345703, -22.099231719970703, -20.068225860595703, -18.037221908569336, -16.006216049194336, -13.975211143493652, -11.944206237792969, -9.913201332092285, -7.882195949554443, -5.851190567016602, -3.820185661315918, -1.7891807556152344, 0.24182510375976562, 2.272830009460449, 4.303834915161133, 6.334839820861816, 8.3658447265625, 10.3968505859375, 12.427855491638184, 14.458860397338867, 16.489866256713867, 18.520870208740234, 20.551876068115234, 22.582881927490234, 24.6138858795166, 26.6448917388916, 28.67589569091797, 30.70690155029297, 32.73790740966797, 34.76891326904297, 36.79991912841797, 38.83092498779297, 40.86193084716797, 42.89293670654297, 44.9239387512207, 46.9549446105957, 48.9859504699707, 51.0169563293457, 53.04795837402344]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 7.0, 5.0, 2.0, 5.0, 12.0, 21.0, 22.0, 46.0, 58.0, 82.0, 156.0, 252.0, 394.0, 580.0, 1085.0, 1867.0, 3669.0, 7315.0, 14740.0, 31690.0, 71695.0, 163541.0, 301480.0, 243118.0, 112883.0, 49504.0, 21950.0, 10662.0, 5301.0, 2754.0, 1480.0, 860.0, 477.0, 345.0, 173.0, 100.0, 77.0, 49.0, 29.0, 24.0, 17.0, 9.0, 8.0, 5.0, 3.0, 4.0, 6.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.82421875, -2.745269775390625, -2.66632080078125, -2.587371826171875, -2.5084228515625, -2.429473876953125, -2.35052490234375, -2.271575927734375, -2.192626953125, -2.113677978515625, -2.03472900390625, -1.955780029296875, -1.8768310546875, -1.797882080078125, -1.71893310546875, -1.639984130859375, -1.56103515625, -1.482086181640625, -1.40313720703125, -1.324188232421875, -1.2452392578125, -1.166290283203125, -1.08734130859375, -1.008392333984375, -0.929443359375, -0.850494384765625, -0.77154541015625, -0.692596435546875, -0.6136474609375, -0.534698486328125, -0.45574951171875, -0.376800537109375, -0.2978515625, -0.218902587890625, -0.13995361328125, -0.061004638671875, 0.0179443359375, 0.096893310546875, 0.17584228515625, 0.254791259765625, 0.333740234375, 0.412689208984375, 0.49163818359375, 0.570587158203125, 0.6495361328125, 0.728485107421875, 0.80743408203125, 0.886383056640625, 0.96533203125, 1.044281005859375, 1.12322998046875, 1.202178955078125, 1.2811279296875, 1.360076904296875, 1.43902587890625, 1.517974853515625, 1.596923828125, 1.675872802734375, 1.75482177734375, 1.833770751953125, 1.9127197265625, 1.991668701171875, 2.07061767578125, 2.149566650390625, 2.228515625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 1.0, 1.0, 3.0, 4.0, 6.0, 7.0, 14.0, 12.0, 14.0, 13.0, 21.0, 20.0, 27.0, 26.0, 44.0, 48.0, 49.0, 43.0, 58.0, 39.0, 56.0, 58.0, 59.0, 41.0, 38.0, 52.0, 36.0, 39.0, 32.0, 31.0, 19.0, 23.0, 11.0, 10.0, 7.0, 16.0, 5.0, 9.0, 3.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.044921875, -1.97857666015625, -1.9122314453125, -1.84588623046875, -1.779541015625, -1.71319580078125, -1.6468505859375, -1.58050537109375, -1.51416015625, -1.44781494140625, -1.3814697265625, -1.31512451171875, -1.248779296875, -1.18243408203125, -1.1160888671875, -1.04974365234375, -0.9833984375, -0.91705322265625, -0.8507080078125, -0.78436279296875, -0.718017578125, -0.65167236328125, -0.5853271484375, -0.51898193359375, -0.45263671875, -0.38629150390625, -0.3199462890625, -0.25360107421875, -0.187255859375, -0.12091064453125, -0.0545654296875, 0.01177978515625, 0.078125, 0.14447021484375, 0.2108154296875, 0.27716064453125, 0.343505859375, 0.40985107421875, 0.4761962890625, 0.54254150390625, 0.60888671875, 0.67523193359375, 0.7415771484375, 0.80792236328125, 0.874267578125, 0.94061279296875, 1.0069580078125, 1.07330322265625, 1.1396484375, 1.20599365234375, 1.2723388671875, 1.33868408203125, 1.405029296875, 1.47137451171875, 1.5377197265625, 1.60406494140625, 1.67041015625, 1.73675537109375, 1.8031005859375, 1.86944580078125, 1.935791015625, 2.00213623046875, 2.0684814453125, 2.13482666015625, 2.201171875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 6.0, 6.0, 2.0, 11.0, 10.0, 23.0, 32.0, 33.0, 40.0, 65.0, 92.0, 123.0, 181.0, 269.0, 431.0, 795.0, 1681.0, 4250.0, 17588.0, 157714.0, 739770.0, 105299.0, 13311.0, 3427.0, 1423.0, 735.0, 410.0, 279.0, 177.0, 116.0, 64.0, 39.0, 37.0, 38.0, 18.0, 13.0, 13.0, 10.0, 7.0, 5.0, 7.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.78125, -5.57781982421875, -5.3743896484375, -5.17095947265625, -4.967529296875, -4.76409912109375, -4.5606689453125, -4.35723876953125, -4.15380859375, -3.95037841796875, -3.7469482421875, -3.54351806640625, -3.340087890625, -3.13665771484375, -2.9332275390625, -2.72979736328125, -2.5263671875, -2.32293701171875, -2.1195068359375, -1.91607666015625, -1.712646484375, -1.50921630859375, -1.3057861328125, -1.10235595703125, -0.89892578125, -0.69549560546875, -0.4920654296875, -0.28863525390625, -0.085205078125, 0.11822509765625, 0.3216552734375, 0.52508544921875, 0.728515625, 0.93194580078125, 1.1353759765625, 1.33880615234375, 1.542236328125, 1.74566650390625, 1.9490966796875, 2.15252685546875, 2.35595703125, 2.55938720703125, 2.7628173828125, 2.96624755859375, 3.169677734375, 3.37310791015625, 3.5765380859375, 3.77996826171875, 3.9833984375, 4.18682861328125, 4.3902587890625, 4.59368896484375, 4.797119140625, 5.00054931640625, 5.2039794921875, 5.40740966796875, 5.61083984375, 5.81427001953125, 6.0177001953125, 6.22113037109375, 6.424560546875, 6.62799072265625, 6.8314208984375, 7.03485107421875, 7.23828125]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 9.0, 9.0, 5.0, 18.0, 11.0, 20.0, 21.0, 20.0, 30.0, 43.0, 64.0, 54.0, 52.0, 56.0, 53.0, 54.0, 66.0, 49.0, 59.0, 56.0, 33.0, 34.0, 38.0, 38.0, 30.0, 23.0, 14.0, 10.0, 9.0, 6.0, 9.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.03125, -7.67919921875, -7.3271484375, -6.97509765625, -6.623046875, -6.27099609375, -5.9189453125, -5.56689453125, -5.21484375, -4.86279296875, -4.5107421875, -4.15869140625, -3.806640625, -3.45458984375, -3.1025390625, -2.75048828125, -2.3984375, -2.04638671875, -1.6943359375, -1.34228515625, -0.990234375, -0.63818359375, -0.2861328125, 0.06591796875, 0.41796875, 0.77001953125, 1.1220703125, 1.47412109375, 1.826171875, 2.17822265625, 2.5302734375, 2.88232421875, 3.234375, 3.58642578125, 3.9384765625, 4.29052734375, 4.642578125, 4.99462890625, 5.3466796875, 5.69873046875, 6.05078125, 6.40283203125, 6.7548828125, 7.10693359375, 7.458984375, 7.81103515625, 8.1630859375, 8.51513671875, 8.8671875, 9.21923828125, 9.5712890625, 9.92333984375, 10.275390625, 10.62744140625, 10.9794921875, 11.33154296875, 11.68359375, 12.03564453125, 12.3876953125, 12.73974609375, 13.091796875, 13.44384765625, 13.7958984375, 14.14794921875, 14.5]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 11.0, 7.0, 12.0, 29.0, 49.0, 88.0, 254.0, 1041.0, 8542.0, 942389.0, 92828.0, 2463.0, 506.0, 191.0, 75.0, 39.0, 12.0, 13.0, 1.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.6328125, -6.4420166015625, -6.251220703125, -6.0604248046875, -5.86962890625, -5.6788330078125, -5.488037109375, -5.2972412109375, -5.1064453125, -4.9156494140625, -4.724853515625, -4.5340576171875, -4.34326171875, -4.1524658203125, -3.961669921875, -3.7708740234375, -3.580078125, -3.3892822265625, -3.198486328125, -3.0076904296875, -2.81689453125, -2.6260986328125, -2.435302734375, -2.2445068359375, -2.0537109375, -1.8629150390625, -1.672119140625, -1.4813232421875, -1.29052734375, -1.0997314453125, -0.908935546875, -0.7181396484375, -0.52734375, -0.3365478515625, -0.145751953125, 0.0450439453125, 0.23583984375, 0.4266357421875, 0.617431640625, 0.8082275390625, 0.9990234375, 1.1898193359375, 1.380615234375, 1.5714111328125, 1.76220703125, 1.9530029296875, 2.143798828125, 2.3345947265625, 2.525390625, 2.7161865234375, 2.906982421875, 3.0977783203125, 3.28857421875, 3.4793701171875, 3.670166015625, 3.8609619140625, 4.0517578125, 4.2425537109375, 4.433349609375, 4.6241455078125, 4.81494140625, 5.0057373046875, 5.196533203125, 5.3873291015625, 5.578125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 1.0, 4.0, 7.0, 12.0, 12.0, 48.0, 50.0, 70.0, 116.0, 138.0, 166.0, 114.0, 95.0, 61.0, 38.0, 23.0, 20.0, 7.0, 10.0, 8.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000583648681640625, -0.0005666688084602356, -0.0005496889352798462, -0.0005327090620994568, -0.0005157291889190674, -0.000498749315738678, -0.0004817694425582886, -0.00046478956937789917, -0.00044780969619750977, -0.00043082982301712036, -0.00041384994983673096, -0.00039687007665634155, -0.00037989020347595215, -0.00036291033029556274, -0.00034593045711517334, -0.00032895058393478394, -0.00031197071075439453, -0.0002949908375740051, -0.0002780109643936157, -0.0002610310912132263, -0.00024405121803283691, -0.0002270713448524475, -0.0002100914716720581, -0.0001931115984916687, -0.0001761317253112793, -0.0001591518521308899, -0.0001421719789505005, -0.00012519210577011108, -0.00010821223258972168, -9.123235940933228e-05, -7.425248622894287e-05, -5.727261304855347e-05, -4.029273986816406e-05, -2.3312866687774658e-05, -6.332993507385254e-06, 1.064687967300415e-05, 2.7626752853393555e-05, 4.460662603378296e-05, 6.158649921417236e-05, 7.856637239456177e-05, 9.554624557495117e-05, 0.00011252611875534058, 0.00012950599193572998, 0.00014648586511611938, 0.0001634657382965088, 0.0001804456114768982, 0.0001974254846572876, 0.000214405357837677, 0.0002313852310180664, 0.0002483651041984558, 0.0002653449773788452, 0.0002823248505592346, 0.000299304723739624, 0.00031628459692001343, 0.00033326447010040283, 0.00035024434328079224, 0.00036722421646118164, 0.00038420408964157104, 0.00040118396282196045, 0.00041816383600234985, 0.00043514370918273926, 0.00045212358236312866, 0.00046910345554351807, 0.00048608332872390747, 0.0005030632019042969]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 6.0, 3.0, 6.0, 8.0, 11.0, 19.0, 44.0, 69.0, 130.0, 287.0, 590.0, 1742.0, 8096.0, 128571.0, 857069.0, 45145.0, 4559.0, 1209.0, 473.0, 211.0, 129.0, 66.0, 37.0, 29.0, 15.0, 10.0, 6.0, 9.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.537109375, -3.437042236328125, -3.33697509765625, -3.236907958984375, -3.1368408203125, -3.036773681640625, -2.93670654296875, -2.836639404296875, -2.736572265625, -2.636505126953125, -2.53643798828125, -2.436370849609375, -2.3363037109375, -2.236236572265625, -2.13616943359375, -2.036102294921875, -1.93603515625, -1.835968017578125, -1.73590087890625, -1.635833740234375, -1.5357666015625, -1.435699462890625, -1.33563232421875, -1.235565185546875, -1.135498046875, -1.035430908203125, -0.93536376953125, -0.835296630859375, -0.7352294921875, -0.635162353515625, -0.53509521484375, -0.435028076171875, -0.3349609375, -0.234893798828125, -0.13482666015625, -0.034759521484375, 0.0653076171875, 0.165374755859375, 0.26544189453125, 0.365509033203125, 0.465576171875, 0.565643310546875, 0.66571044921875, 0.765777587890625, 0.8658447265625, 0.965911865234375, 1.06597900390625, 1.166046142578125, 1.26611328125, 1.366180419921875, 1.46624755859375, 1.566314697265625, 1.6663818359375, 1.766448974609375, 1.86651611328125, 1.966583251953125, 2.066650390625, 2.166717529296875, 2.26678466796875, 2.366851806640625, 2.4669189453125, 2.566986083984375, 2.66705322265625, 2.767120361328125, 2.8671875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 6.0, 12.0, 17.0, 27.0, 44.0, 69.0, 90.0, 112.0, 129.0, 119.0, 111.0, 75.0, 56.0, 39.0, 34.0, 10.0, 16.0, 10.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-4.078125, -3.97821044921875, -3.8782958984375, -3.77838134765625, -3.678466796875, -3.57855224609375, -3.4786376953125, -3.37872314453125, -3.27880859375, -3.17889404296875, -3.0789794921875, -2.97906494140625, -2.879150390625, -2.77923583984375, -2.6793212890625, -2.57940673828125, -2.4794921875, -2.37957763671875, -2.2796630859375, -2.17974853515625, -2.079833984375, -1.97991943359375, -1.8800048828125, -1.78009033203125, -1.68017578125, -1.58026123046875, -1.4803466796875, -1.38043212890625, -1.280517578125, -1.18060302734375, -1.0806884765625, -0.98077392578125, -0.880859375, -0.78094482421875, -0.6810302734375, -0.58111572265625, -0.481201171875, -0.38128662109375, -0.2813720703125, -0.18145751953125, -0.08154296875, 0.01837158203125, 0.1182861328125, 0.21820068359375, 0.318115234375, 0.41802978515625, 0.5179443359375, 0.61785888671875, 0.7177734375, 0.81768798828125, 0.9176025390625, 1.01751708984375, 1.117431640625, 1.21734619140625, 1.3172607421875, 1.41717529296875, 1.51708984375, 1.61700439453125, 1.7169189453125, 1.81683349609375, 1.916748046875, 2.01666259765625, 2.1165771484375, 2.21649169921875, 2.31640625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 10.0, 11.0, 20.0, 70.0, 258.0, 416.0, 167.0, 39.0, 14.0, 5.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.02415466308594, -105.8547592163086, -102.68536376953125, -99.51597595214844, -96.3465805053711, -93.17718505859375, -90.0077896118164, -86.83839416503906, -83.66900634765625, -80.4996109008789, -77.33021545410156, -74.16082763671875, -70.9914321899414, -67.82203674316406, -64.65264129638672, -61.48324966430664, -58.3138542175293, -55.14445877075195, -51.975067138671875, -48.80567169189453, -45.63628005981445, -42.46688461303711, -39.29749298095703, -36.12809753417969, -32.958702087402344, -29.789308547973633, -26.619915008544922, -23.450519561767578, -20.2811279296875, -17.111732482910156, -13.942338943481445, -10.772945404052734, -7.603553771972656, -4.434160232543945, -1.2647662162780762, 1.904627799987793, 5.074021339416504, 8.243414878845215, 11.412809371948242, 14.582202911376953, 17.751596450805664, 20.920989990234375, 24.090383529663086, 27.259777069091797, 30.42917251586914, 33.59856414794922, 36.76795959472656, 39.937355041503906, 43.106746673583984, 46.27614212036133, 49.445533752441406, 52.61492919921875, 55.78432083129883, 58.95371627807617, 62.12310791015625, 65.2925033569336, 68.46189880371094, 71.63129425048828, 74.80068969726562, 77.97007751464844, 81.13947296142578, 84.30886840820312, 87.47826385498047, 90.64765930175781, 93.81704711914062]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 2.0, 10.0, 2.0, 7.0, 12.0, 17.0, 13.0, 25.0, 19.0, 29.0, 33.0, 42.0, 42.0, 37.0, 59.0, 70.0, 66.0, 77.0, 55.0, 58.0, 51.0, 48.0, 34.0, 43.0, 27.0, 27.0, 20.0, 13.0, 15.0, 7.0, 8.0, 10.0, 4.0, 7.0, 2.0, 0.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.847957611083984, -37.507774353027344, -36.16758728027344, -34.8274040222168, -33.487220764160156, -32.147037506103516, -30.80685043334961, -29.46666717529297, -28.126483917236328, -26.786298751831055, -25.446115493774414, -24.10593032836914, -22.7657470703125, -21.425561904907227, -20.085376739501953, -18.745193481445312, -17.40500831604004, -16.064823150634766, -14.724639892578125, -13.384454727172852, -12.044271469116211, -10.704086303710938, -9.36390209197998, -8.023717880249023, -6.683533668518066, -5.343349456787109, -4.003165245056152, -2.662980556488037, -1.32279634475708, 0.017387866973876953, 1.3575725555419922, 2.697756767272949, 4.037940979003906, 5.378125190734863, 6.71830940246582, 8.058494567871094, 9.398677825927734, 10.738862991333008, 12.079047203063965, 13.419231414794922, 14.759415626525879, 16.099599838256836, 17.43978500366211, 18.77996826171875, 20.120153427124023, 21.460336685180664, 22.800521850585938, 24.140705108642578, 25.48089027404785, 26.821075439453125, 28.161258697509766, 29.50144386291504, 30.84162712097168, 32.18181228637695, 33.521995544433594, 34.8621826171875, 36.20236587524414, 37.54254913330078, 38.88273620605469, 40.22291946411133, 41.56310272216797, 42.90328598022461, 44.243473052978516, 45.583656311035156, 46.9238395690918]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 4.0, 5.0, 3.0, 13.0, 20.0, 12.0, 14.0, 20.0, 31.0, 45.0, 48.0, 75.0, 135.0, 228.0, 576.0, 1806.0, 7852.0, 79722.0, 3932864.0, 155293.0, 11526.0, 2488.0, 713.0, 287.0, 163.0, 99.0, 61.0, 39.0, 31.0, 26.0, 17.0, 14.0, 12.0, 9.0, 8.0, 4.0, 1.0, 1.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.25390625, -6.06201171875, -5.8701171875, -5.67822265625, -5.486328125, -5.29443359375, -5.1025390625, -4.91064453125, -4.71875, -4.52685546875, -4.3349609375, -4.14306640625, -3.951171875, -3.75927734375, -3.5673828125, -3.37548828125, -3.18359375, -2.99169921875, -2.7998046875, -2.60791015625, -2.416015625, -2.22412109375, -2.0322265625, -1.84033203125, -1.6484375, -1.45654296875, -1.2646484375, -1.07275390625, -0.880859375, -0.68896484375, -0.4970703125, -0.30517578125, -0.11328125, 0.07861328125, 0.2705078125, 0.46240234375, 0.654296875, 0.84619140625, 1.0380859375, 1.22998046875, 1.421875, 1.61376953125, 1.8056640625, 1.99755859375, 2.189453125, 2.38134765625, 2.5732421875, 2.76513671875, 2.95703125, 3.14892578125, 3.3408203125, 3.53271484375, 3.724609375, 3.91650390625, 4.1083984375, 4.30029296875, 4.4921875, 4.68408203125, 4.8759765625, 5.06787109375, 5.259765625, 5.45166015625, 5.6435546875, 5.83544921875, 6.02734375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 9.0, 12.0, 20.0, 31.0, 35.0, 55.0, 86.0, 129.0, 106.0, 112.0, 102.0, 77.0, 76.0, 59.0, 33.0, 24.0, 17.0, 9.0, 5.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.89453125, -4.76983642578125, -4.6451416015625, -4.52044677734375, -4.395751953125, -4.27105712890625, -4.1463623046875, -4.02166748046875, -3.89697265625, -3.77227783203125, -3.6475830078125, -3.52288818359375, -3.398193359375, -3.27349853515625, -3.1488037109375, -3.02410888671875, -2.8994140625, -2.77471923828125, -2.6500244140625, -2.52532958984375, -2.400634765625, -2.27593994140625, -2.1512451171875, -2.02655029296875, -1.90185546875, -1.77716064453125, -1.6524658203125, -1.52777099609375, -1.403076171875, -1.27838134765625, -1.1536865234375, -1.02899169921875, -0.904296875, -0.77960205078125, -0.6549072265625, -0.53021240234375, -0.405517578125, -0.28082275390625, -0.1561279296875, -0.03143310546875, 0.09326171875, 0.21795654296875, 0.3426513671875, 0.46734619140625, 0.592041015625, 0.71673583984375, 0.8414306640625, 0.96612548828125, 1.0908203125, 1.21551513671875, 1.3402099609375, 1.46490478515625, 1.589599609375, 1.71429443359375, 1.8389892578125, 1.96368408203125, 2.08837890625, 2.21307373046875, 2.3377685546875, 2.46246337890625, 2.587158203125, 2.71185302734375, 2.8365478515625, 2.96124267578125, 3.0859375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 7.0, 7.0, 7.0, 16.0, 27.0, 41.0, 78.0, 164.0, 375.0, 864.0, 2118.0, 5501.0, 18220.0, 89646.0, 2888486.0, 1110253.0, 58454.0, 13002.0, 4145.0, 1620.0, 653.0, 300.0, 126.0, 64.0, 34.0, 20.0, 13.0, 14.0, 9.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.64453125, -4.51141357421875, -4.3782958984375, -4.24517822265625, -4.112060546875, -3.97894287109375, -3.8458251953125, -3.71270751953125, -3.57958984375, -3.44647216796875, -3.3133544921875, -3.18023681640625, -3.047119140625, -2.91400146484375, -2.7808837890625, -2.64776611328125, -2.5146484375, -2.38153076171875, -2.2484130859375, -2.11529541015625, -1.982177734375, -1.84906005859375, -1.7159423828125, -1.58282470703125, -1.44970703125, -1.31658935546875, -1.1834716796875, -1.05035400390625, -0.917236328125, -0.78411865234375, -0.6510009765625, -0.51788330078125, -0.384765625, -0.25164794921875, -0.1185302734375, 0.01458740234375, 0.147705078125, 0.28082275390625, 0.4139404296875, 0.54705810546875, 0.68017578125, 0.81329345703125, 0.9464111328125, 1.07952880859375, 1.212646484375, 1.34576416015625, 1.4788818359375, 1.61199951171875, 1.7451171875, 1.87823486328125, 2.0113525390625, 2.14447021484375, 2.277587890625, 2.41070556640625, 2.5438232421875, 2.67694091796875, 2.81005859375, 2.94317626953125, 3.0762939453125, 3.20941162109375, 3.342529296875, 3.47564697265625, 3.6087646484375, 3.74188232421875, 3.875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 10.0, 5.0, 9.0, 9.0, 19.0, 27.0, 25.0, 41.0, 72.0, 110.0, 232.0, 509.0, 1063.0, 923.0, 481.0, 216.0, 99.0, 71.0, 34.0, 33.0, 23.0, 9.0, 12.0, 4.0, 6.0, 3.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.18359375, -4.0526123046875, -3.921630859375, -3.7906494140625, -3.65966796875, -3.5286865234375, -3.397705078125, -3.2667236328125, -3.1357421875, -3.0047607421875, -2.873779296875, -2.7427978515625, -2.61181640625, -2.4808349609375, -2.349853515625, -2.2188720703125, -2.087890625, -1.9569091796875, -1.825927734375, -1.6949462890625, -1.56396484375, -1.4329833984375, -1.302001953125, -1.1710205078125, -1.0400390625, -0.9090576171875, -0.778076171875, -0.6470947265625, -0.51611328125, -0.3851318359375, -0.254150390625, -0.1231689453125, 0.0078125, 0.1387939453125, 0.269775390625, 0.4007568359375, 0.53173828125, 0.6627197265625, 0.793701171875, 0.9246826171875, 1.0556640625, 1.1866455078125, 1.317626953125, 1.4486083984375, 1.57958984375, 1.7105712890625, 1.841552734375, 1.9725341796875, 2.103515625, 2.2344970703125, 2.365478515625, 2.4964599609375, 2.62744140625, 2.7584228515625, 2.889404296875, 3.0203857421875, 3.1513671875, 3.2823486328125, 3.413330078125, 3.5443115234375, 3.67529296875, 3.8062744140625, 3.937255859375, 4.0682373046875, 4.19921875]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 10.0, 19.0, 67.0, 236.0, 430.0, 187.0, 44.0, 2.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.36293029785156, -43.234737396240234, -41.106544494628906, -38.97834777832031, -36.850154876708984, -34.721961975097656, -32.59376907348633, -30.465576171875, -28.33738136291504, -26.20918846130371, -24.08099365234375, -21.952800750732422, -19.824607849121094, -17.696413040161133, -15.568220138549805, -13.44002628326416, -11.311832427978516, -9.183638572692871, -7.055445194244385, -4.927251815795898, -2.799057960510254, -0.6708641052246094, 1.4573287963867188, 3.5855226516723633, 5.713716506958008, 7.841910362243652, 9.970104217529297, 12.098297119140625, 14.22649097442627, 16.354684829711914, 18.482877731323242, 20.611072540283203, 22.73926544189453, 24.86745834350586, 26.99565315246582, 29.12384605407715, 31.25204086303711, 33.38023376464844, 35.508426666259766, 37.636619567871094, 39.76481628417969, 41.893009185791016, 44.021202087402344, 46.14939880371094, 48.277591705322266, 50.405784606933594, 52.53397750854492, 54.66217041015625, 56.79036331176758, 58.918556213378906, 61.046749114990234, 63.17494201660156, 65.30313873291016, 67.43133544921875, 69.55952453613281, 71.6877212524414, 73.81591033935547, 75.94410705566406, 78.07229614257812, 80.20049285888672, 82.32868194580078, 84.45687866210938, 86.58506774902344, 88.71326446533203, 90.84146118164062]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 3.0, 4.0, 14.0, 14.0, 9.0, 17.0, 35.0, 34.0, 29.0, 46.0, 48.0, 61.0, 71.0, 75.0, 72.0, 75.0, 64.0, 55.0, 56.0, 46.0, 43.0, 31.0, 21.0, 25.0, 19.0, 11.0, 6.0, 7.0, 3.0, 1.0, 6.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.67819595336914, -20.949275970458984, -20.220355987548828, -19.491436004638672, -18.762514114379883, -18.033594131469727, -17.30467414855957, -16.575754165649414, -15.846833229064941, -15.117913246154785, -14.388992309570312, -13.660072326660156, -12.93115234375, -12.202231407165527, -11.473311424255371, -10.744390487670898, -10.015470504760742, -9.286550521850586, -8.557629585266113, -7.828709602355957, -7.099789142608643, -6.370868682861328, -5.641948699951172, -4.913028240203857, -4.184107780456543, -3.4551873207092285, -2.726267099380493, -1.9973468780517578, -1.2684264183044434, -0.5395059585571289, 0.18941402435302734, 0.9183344841003418, 1.6472549438476562, 2.3761754035949707, 3.105095624923706, 3.8340158462524414, 4.562936305999756, 5.29185676574707, 6.020776748657227, 6.749697208404541, 7.4786176681518555, 8.207537651062012, 8.936458587646484, 9.66537857055664, 10.394298553466797, 11.12321949005127, 11.852139472961426, 12.581060409545898, 13.309980392456055, 14.038900375366211, 14.767821311950684, 15.49674129486084, 16.225662231445312, 16.95458221435547, 17.683502197265625, 18.41242218017578, 19.141342163085938, 19.870262145996094, 20.59918212890625, 21.328102111816406, 22.057024002075195, 22.78594398498535, 23.514863967895508, 24.243783950805664, 24.972705841064453]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 7.0, 10.0, 12.0, 33.0, 35.0, 58.0, 92.0, 116.0, 206.0, 328.0, 540.0, 945.0, 1589.0, 2887.0, 5470.0, 11134.0, 24554.0, 57232.0, 135835.0, 287426.0, 284266.0, 132602.0, 55781.0, 24006.0, 11097.0, 5468.0, 2868.0, 1595.0, 939.0, 516.0, 337.0, 225.0, 112.0, 76.0, 61.0, 32.0, 24.0, 14.0, 12.0, 12.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.494140625, -2.416168212890625, -2.33819580078125, -2.260223388671875, -2.1822509765625, -2.104278564453125, -2.02630615234375, -1.948333740234375, -1.870361328125, -1.792388916015625, -1.71441650390625, -1.636444091796875, -1.5584716796875, -1.480499267578125, -1.40252685546875, -1.324554443359375, -1.24658203125, -1.168609619140625, -1.09063720703125, -1.012664794921875, -0.9346923828125, -0.856719970703125, -0.77874755859375, -0.700775146484375, -0.622802734375, -0.544830322265625, -0.46685791015625, -0.388885498046875, -0.3109130859375, -0.232940673828125, -0.15496826171875, -0.076995849609375, 0.0009765625, 0.078948974609375, 0.15692138671875, 0.234893798828125, 0.3128662109375, 0.390838623046875, 0.46881103515625, 0.546783447265625, 0.624755859375, 0.702728271484375, 0.78070068359375, 0.858673095703125, 0.9366455078125, 1.014617919921875, 1.09259033203125, 1.170562744140625, 1.24853515625, 1.326507568359375, 1.40447998046875, 1.482452392578125, 1.5604248046875, 1.638397216796875, 1.71636962890625, 1.794342041015625, 1.872314453125, 1.950286865234375, 2.02825927734375, 2.106231689453125, 2.1842041015625, 2.262176513671875, 2.34014892578125, 2.418121337890625, 2.49609375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 5.0, 8.0, 13.0, 19.0, 12.0, 20.0, 18.0, 32.0, 24.0, 33.0, 37.0, 49.0, 37.0, 48.0, 51.0, 44.0, 45.0, 49.0, 47.0, 40.0, 38.0, 45.0, 39.0, 32.0, 33.0, 27.0, 28.0, 22.0, 21.0, 19.0, 9.0, 11.0, 12.0, 6.0, 8.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.9296875, -1.8745880126953125, -1.819488525390625, -1.7643890380859375, -1.70928955078125, -1.6541900634765625, -1.599090576171875, -1.5439910888671875, -1.4888916015625, -1.4337921142578125, -1.378692626953125, -1.3235931396484375, -1.26849365234375, -1.2133941650390625, -1.158294677734375, -1.1031951904296875, -1.048095703125, -0.9929962158203125, -0.937896728515625, -0.8827972412109375, -0.82769775390625, -0.7725982666015625, -0.717498779296875, -0.6623992919921875, -0.6072998046875, -0.5522003173828125, -0.497100830078125, -0.4420013427734375, -0.38690185546875, -0.3318023681640625, -0.276702880859375, -0.2216033935546875, -0.16650390625, -0.1114044189453125, -0.056304931640625, -0.0012054443359375, 0.05389404296875, 0.1089935302734375, 0.164093017578125, 0.2191925048828125, 0.2742919921875, 0.3293914794921875, 0.384490966796875, 0.4395904541015625, 0.49468994140625, 0.5497894287109375, 0.604888916015625, 0.6599884033203125, 0.715087890625, 0.7701873779296875, 0.825286865234375, 0.8803863525390625, 0.93548583984375, 0.9905853271484375, 1.045684814453125, 1.1007843017578125, 1.1558837890625, 1.2109832763671875, 1.266082763671875, 1.3211822509765625, 1.37628173828125, 1.4313812255859375, 1.486480712890625, 1.5415802001953125, 1.5966796875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 4.0, 8.0, 10.0, 24.0, 36.0, 52.0, 101.0, 178.0, 376.0, 838.0, 2698.0, 19422.0, 586660.0, 418045.0, 16011.0, 2471.0, 845.0, 364.0, 164.0, 91.0, 54.0, 41.0, 12.0, 19.0, 9.0, 3.0, 3.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.85546875, -6.55694580078125, -6.2584228515625, -5.95989990234375, -5.661376953125, -5.36285400390625, -5.0643310546875, -4.76580810546875, -4.46728515625, -4.16876220703125, -3.8702392578125, -3.57171630859375, -3.273193359375, -2.97467041015625, -2.6761474609375, -2.37762451171875, -2.0791015625, -1.78057861328125, -1.4820556640625, -1.18353271484375, -0.885009765625, -0.58648681640625, -0.2879638671875, 0.01055908203125, 0.30908203125, 0.60760498046875, 0.9061279296875, 1.20465087890625, 1.503173828125, 1.80169677734375, 2.1002197265625, 2.39874267578125, 2.697265625, 2.99578857421875, 3.2943115234375, 3.59283447265625, 3.891357421875, 4.18988037109375, 4.4884033203125, 4.78692626953125, 5.08544921875, 5.38397216796875, 5.6824951171875, 5.98101806640625, 6.279541015625, 6.57806396484375, 6.8765869140625, 7.17510986328125, 7.4736328125, 7.77215576171875, 8.0706787109375, 8.36920166015625, 8.667724609375, 8.96624755859375, 9.2647705078125, 9.56329345703125, 9.86181640625, 10.16033935546875, 10.4588623046875, 10.75738525390625, 11.055908203125, 11.35443115234375, 11.6529541015625, 11.95147705078125, 12.25]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 6.0, 8.0, 11.0, 10.0, 16.0, 19.0, 20.0, 28.0, 25.0, 35.0, 49.0, 50.0, 55.0, 52.0, 68.0, 58.0, 75.0, 48.0, 50.0, 51.0, 42.0, 33.0, 40.0, 27.0, 32.0, 21.0, 19.0, 15.0, 15.0, 12.0, 3.0, 5.0, 3.0, 0.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.265625, -7.006591796875, -6.74755859375, -6.488525390625, -6.2294921875, -5.970458984375, -5.71142578125, -5.452392578125, -5.193359375, -4.934326171875, -4.67529296875, -4.416259765625, -4.1572265625, -3.898193359375, -3.63916015625, -3.380126953125, -3.12109375, -2.862060546875, -2.60302734375, -2.343994140625, -2.0849609375, -1.825927734375, -1.56689453125, -1.307861328125, -1.048828125, -0.789794921875, -0.53076171875, -0.271728515625, -0.0126953125, 0.246337890625, 0.50537109375, 0.764404296875, 1.0234375, 1.282470703125, 1.54150390625, 1.800537109375, 2.0595703125, 2.318603515625, 2.57763671875, 2.836669921875, 3.095703125, 3.354736328125, 3.61376953125, 3.872802734375, 4.1318359375, 4.390869140625, 4.64990234375, 4.908935546875, 5.16796875, 5.427001953125, 5.68603515625, 5.945068359375, 6.2041015625, 6.463134765625, 6.72216796875, 6.981201171875, 7.240234375, 7.499267578125, 7.75830078125, 8.017333984375, 8.2763671875, 8.535400390625, 8.79443359375, 9.053466796875, 9.3125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 10.0, 16.0, 29.0, 31.0, 68.0, 102.0, 213.0, 541.0, 1664.0, 9416.0, 146409.0, 820964.0, 61573.0, 5513.0, 1192.0, 398.0, 172.0, 86.0, 47.0, 23.0, 20.0, 10.0, 10.0, 8.0, 8.0, 8.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.052734375, -2.958404541015625, -2.86407470703125, -2.769744873046875, -2.6754150390625, -2.581085205078125, -2.48675537109375, -2.392425537109375, -2.298095703125, -2.203765869140625, -2.10943603515625, -2.015106201171875, -1.9207763671875, -1.826446533203125, -1.73211669921875, -1.637786865234375, -1.54345703125, -1.449127197265625, -1.35479736328125, -1.260467529296875, -1.1661376953125, -1.071807861328125, -0.97747802734375, -0.883148193359375, -0.788818359375, -0.694488525390625, -0.60015869140625, -0.505828857421875, -0.4114990234375, -0.317169189453125, -0.22283935546875, -0.128509521484375, -0.0341796875, 0.060150146484375, 0.15447998046875, 0.248809814453125, 0.3431396484375, 0.437469482421875, 0.53179931640625, 0.626129150390625, 0.720458984375, 0.814788818359375, 0.90911865234375, 1.003448486328125, 1.0977783203125, 1.192108154296875, 1.28643798828125, 1.380767822265625, 1.47509765625, 1.569427490234375, 1.66375732421875, 1.758087158203125, 1.8524169921875, 1.946746826171875, 2.04107666015625, 2.135406494140625, 2.229736328125, 2.324066162109375, 2.41839599609375, 2.512725830078125, 2.6070556640625, 2.701385498046875, 2.79571533203125, 2.890045166015625, 2.984375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 4.0, 1.0, 5.0, 5.0, 8.0, 8.0, 13.0, 23.0, 14.0, 33.0, 21.0, 37.0, 47.0, 58.0, 52.0, 60.0, 96.0, 77.0, 84.0, 55.0, 58.0, 53.0, 33.0, 30.0, 32.0, 26.0, 18.0, 12.0, 4.0, 8.0, 5.0, 5.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00027370452880859375, -0.00026365742087364197, -0.0002536103129386902, -0.0002435632050037384, -0.00023351609706878662, -0.00022346898913383484, -0.00021342188119888306, -0.00020337477326393127, -0.0001933276653289795, -0.0001832805573940277, -0.00017323344945907593, -0.00016318634152412415, -0.00015313923358917236, -0.00014309212565422058, -0.0001330450177192688, -0.00012299790978431702, -0.00011295080184936523, -0.00010290369391441345, -9.285658597946167e-05, -8.280947804450989e-05, -7.27623701095581e-05, -6.271526217460632e-05, -5.266815423965454e-05, -4.262104630470276e-05, -3.2573938369750977e-05, -2.2526830434799194e-05, -1.2479722499847412e-05, -2.43261456489563e-06, 7.614493370056152e-06, 1.7661601305007935e-05, 2.7708709239959717e-05, 3.77558171749115e-05, 4.780292510986328e-05, 5.7850033044815063e-05, 6.789714097976685e-05, 7.794424891471863e-05, 8.799135684967041e-05, 9.803846478462219e-05, 0.00010808557271957397, 0.00011813268065452576, 0.00012817978858947754, 0.00013822689652442932, 0.0001482740044593811, 0.00015832111239433289, 0.00016836822032928467, 0.00017841532826423645, 0.00018846243619918823, 0.00019850954413414001, 0.0002085566520690918, 0.00021860376000404358, 0.00022865086793899536, 0.00023869797587394714, 0.0002487450838088989, 0.0002587921917438507, 0.0002688392996788025, 0.00027888640761375427, 0.00028893351554870605, 0.00029898062348365784, 0.0003090277314186096, 0.0003190748393535614, 0.0003291219472885132, 0.00033916905522346497, 0.00034921616315841675, 0.00035926327109336853, 0.0003693103790283203]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 6.0, 11.0, 17.0, 29.0, 39.0, 92.0, 168.0, 401.0, 1146.0, 4697.0, 51998.0, 845183.0, 134173.0, 7968.0, 1664.0, 505.0, 219.0, 109.0, 45.0, 25.0, 20.0, 16.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.880859375, -2.783660888671875, -2.68646240234375, -2.589263916015625, -2.4920654296875, -2.394866943359375, -2.29766845703125, -2.200469970703125, -2.103271484375, -2.006072998046875, -1.90887451171875, -1.811676025390625, -1.7144775390625, -1.617279052734375, -1.52008056640625, -1.422882080078125, -1.32568359375, -1.228485107421875, -1.13128662109375, -1.034088134765625, -0.9368896484375, -0.839691162109375, -0.74249267578125, -0.645294189453125, -0.548095703125, -0.450897216796875, -0.35369873046875, -0.256500244140625, -0.1593017578125, -0.062103271484375, 0.03509521484375, 0.132293701171875, 0.2294921875, 0.326690673828125, 0.42388916015625, 0.521087646484375, 0.6182861328125, 0.715484619140625, 0.81268310546875, 0.909881591796875, 1.007080078125, 1.104278564453125, 1.20147705078125, 1.298675537109375, 1.3958740234375, 1.493072509765625, 1.59027099609375, 1.687469482421875, 1.78466796875, 1.881866455078125, 1.97906494140625, 2.076263427734375, 2.1734619140625, 2.270660400390625, 2.36785888671875, 2.465057373046875, 2.562255859375, 2.659454345703125, 2.75665283203125, 2.853851318359375, 2.9510498046875, 3.048248291015625, 3.14544677734375, 3.242645263671875, 3.33984375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 5.0, 6.0, 9.0, 13.0, 19.0, 24.0, 25.0, 25.0, 44.0, 54.0, 56.0, 56.0, 74.0, 82.0, 87.0, 73.0, 59.0, 59.0, 40.0, 35.0, 39.0, 38.0, 24.0, 9.0, 12.0, 8.0, 10.0, 5.0, 2.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.09375, -2.0397186279296875, -1.985687255859375, -1.9316558837890625, -1.87762451171875, -1.8235931396484375, -1.769561767578125, -1.7155303955078125, -1.6614990234375, -1.6074676513671875, -1.553436279296875, -1.4994049072265625, -1.44537353515625, -1.3913421630859375, -1.337310791015625, -1.2832794189453125, -1.229248046875, -1.1752166748046875, -1.121185302734375, -1.0671539306640625, -1.01312255859375, -0.9590911865234375, -0.905059814453125, -0.8510284423828125, -0.7969970703125, -0.7429656982421875, -0.688934326171875, -0.6349029541015625, -0.58087158203125, -0.5268402099609375, -0.472808837890625, -0.4187774658203125, -0.36474609375, -0.3107147216796875, -0.256683349609375, -0.2026519775390625, -0.14862060546875, -0.0945892333984375, -0.040557861328125, 0.0134735107421875, 0.0675048828125, 0.1215362548828125, 0.175567626953125, 0.2295989990234375, 0.28363037109375, 0.3376617431640625, 0.391693115234375, 0.4457244873046875, 0.499755859375, 0.5537872314453125, 0.607818603515625, 0.6618499755859375, 0.71588134765625, 0.7699127197265625, 0.823944091796875, 0.8779754638671875, 0.9320068359375, 0.9860382080078125, 1.040069580078125, 1.0941009521484375, 1.14813232421875, 1.2021636962890625, 1.256195068359375, 1.3102264404296875, 1.3642578125]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 7.0, 16.0, 51.0, 145.0, 304.0, 232.0, 121.0, 66.0, 28.0, 13.0, 2.0, 8.0, 6.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.038732528686523, -20.14340591430664, -18.24808120727539, -16.352754592895508, -14.457428932189941, -12.562103271484375, -10.666776657104492, -8.771450996398926, -6.876125335693359, -4.980799674987793, -3.0854735374450684, -1.1901473999023438, 0.7051782608032227, 2.600503921508789, 4.495830535888672, 6.391156196594238, 8.286481857299805, 10.181807518005371, 12.077133178710938, 13.97245979309082, 15.867785453796387, 17.763111114501953, 19.658437728881836, 21.55376434326172, 23.44908905029297, 25.34441566467285, 27.2397403717041, 29.135066986083984, 31.030391693115234, 32.92572021484375, 34.821044921875, 36.71636962890625, 38.6116943359375, 40.50701904296875, 42.402347564697266, 44.297672271728516, 46.192996978759766, 48.08832550048828, 49.98365020751953, 51.87897491455078, 53.77429962158203, 55.66962432861328, 57.5649528503418, 59.46027755737305, 61.3556022644043, 63.25093078613281, 65.14625549316406, 67.04158020019531, 68.93690490722656, 70.83222961425781, 72.72755432128906, 74.62287902832031, 76.5182113647461, 78.41353607177734, 80.3088607788086, 82.20418548583984, 84.09951782226562, 85.99484252929688, 87.89016723632812, 89.78549194335938, 91.68082427978516, 93.5761489868164, 95.47147369384766, 97.3667984008789, 99.26212310791016]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 9.0, 7.0, 2.0, 7.0, 17.0, 15.0, 19.0, 19.0, 22.0, 15.0, 33.0, 31.0, 35.0, 37.0, 32.0, 53.0, 49.0, 79.0, 67.0, 54.0, 52.0, 45.0, 43.0, 40.0, 44.0, 27.0, 28.0, 23.0, 22.0, 19.0, 13.0, 15.0, 9.0, 7.0, 6.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.870561599731445, -22.933279037475586, -21.995996475219727, -21.058713912963867, -20.121431350708008, -19.18414878845215, -18.246868133544922, -17.309585571289062, -16.372303009033203, -15.435020446777344, -14.497737884521484, -13.560455322265625, -12.623172760009766, -11.685890197753906, -10.748608589172363, -9.811326026916504, -8.874042510986328, -7.936759948730469, -6.999477386474609, -6.062195301055908, -5.124912738800049, -4.1876301765441895, -3.2503480911254883, -2.313065528869629, -1.3757829666137695, -0.4385005235671997, 0.4987819194793701, 1.4360642433166504, 2.3733468055725098, 3.310629367828369, 4.24791145324707, 5.18519401550293, 6.122474670410156, 7.059757232666016, 7.997039794921875, 8.934322357177734, 9.871604919433594, 10.808887481689453, 11.746169090270996, 12.683451652526855, 13.620734214782715, 14.558016777038574, 15.495299339294434, 16.432580947875977, 17.369863510131836, 18.307146072387695, 19.244428634643555, 20.181711196899414, 21.118993759155273, 22.056276321411133, 22.993558883666992, 23.93084144592285, 24.86812400817871, 25.80540657043457, 26.742687225341797, 27.679969787597656, 28.617252349853516, 29.554534912109375, 30.491817474365234, 31.429100036621094, 32.36638259887695, 33.30366516113281, 34.24094772338867, 35.17823028564453, 36.11551284790039]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 3.0, 16.0, 11.0, 31.0, 25.0, 50.0, 89.0, 158.0, 384.0, 899.0, 2111.0, 5938.0, 19028.0, 89732.0, 1131962.0, 2681692.0, 216413.0, 32745.0, 8305.0, 2697.0, 971.0, 412.0, 230.0, 116.0, 80.0, 60.0, 36.0, 28.0, 17.0, 12.0, 8.0, 9.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.916015625, -1.8297119140625, -1.743408203125, -1.6571044921875, -1.57080078125, -1.4844970703125, -1.398193359375, -1.3118896484375, -1.2255859375, -1.1392822265625, -1.052978515625, -0.9666748046875, -0.88037109375, -0.7940673828125, -0.707763671875, -0.6214599609375, -0.53515625, -0.4488525390625, -0.362548828125, -0.2762451171875, -0.18994140625, -0.1036376953125, -0.017333984375, 0.0689697265625, 0.1552734375, 0.2415771484375, 0.327880859375, 0.4141845703125, 0.50048828125, 0.5867919921875, 0.673095703125, 0.7593994140625, 0.845703125, 0.9320068359375, 1.018310546875, 1.1046142578125, 1.19091796875, 1.2772216796875, 1.363525390625, 1.4498291015625, 1.5361328125, 1.6224365234375, 1.708740234375, 1.7950439453125, 1.88134765625, 1.9676513671875, 2.053955078125, 2.1402587890625, 2.2265625, 2.3128662109375, 2.399169921875, 2.4854736328125, 2.57177734375, 2.6580810546875, 2.744384765625, 2.8306884765625, 2.9169921875, 3.0032958984375, 3.089599609375, 3.1759033203125, 3.26220703125, 3.3485107421875, 3.434814453125, 3.5211181640625, 3.607421875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 12.0, 24.0, 31.0, 60.0, 50.0, 73.0, 88.0, 105.0, 82.0, 77.0, 89.0, 88.0, 78.0, 49.0, 36.0, 25.0, 19.0, 10.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6435546875, -1.5454254150390625, -1.447296142578125, -1.3491668701171875, -1.25103759765625, -1.1529083251953125, -1.054779052734375, -0.9566497802734375, -0.8585205078125, -0.7603912353515625, -0.662261962890625, -0.5641326904296875, -0.46600341796875, -0.3678741455078125, -0.269744873046875, -0.1716156005859375, -0.073486328125, 0.0246429443359375, 0.122772216796875, 0.2209014892578125, 0.31903076171875, 0.4171600341796875, 0.515289306640625, 0.6134185791015625, 0.7115478515625, 0.8096771240234375, 0.907806396484375, 1.0059356689453125, 1.10406494140625, 1.2021942138671875, 1.300323486328125, 1.3984527587890625, 1.49658203125, 1.5947113037109375, 1.692840576171875, 1.7909698486328125, 1.88909912109375, 1.9872283935546875, 2.085357666015625, 2.1834869384765625, 2.2816162109375, 2.3797454833984375, 2.477874755859375, 2.5760040283203125, 2.67413330078125, 2.7722625732421875, 2.870391845703125, 2.9685211181640625, 3.066650390625, 3.1647796630859375, 3.262908935546875, 3.3610382080078125, 3.45916748046875, 3.5572967529296875, 3.655426025390625, 3.7535552978515625, 3.8516845703125, 3.9498138427734375, 4.047943115234375, 4.1460723876953125, 4.24420166015625, 4.3423309326171875, 4.440460205078125, 4.5385894775390625, 4.63671875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 6.0, 5.0, 7.0, 5.0, 9.0, 10.0, 17.0, 25.0, 30.0, 40.0, 69.0, 83.0, 134.0, 178.0, 340.0, 627.0, 1530.0, 4131.0, 13630.0, 57861.0, 477485.0, 3391223.0, 204009.0, 31458.0, 7436.0, 2137.0, 801.0, 391.0, 197.0, 121.0, 89.0, 62.0, 39.0, 26.0, 15.0, 15.0, 11.0, 8.0, 3.0, 6.0, 8.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.42578125, -3.31292724609375, -3.2000732421875, -3.08721923828125, -2.974365234375, -2.86151123046875, -2.7486572265625, -2.63580322265625, -2.52294921875, -2.41009521484375, -2.2972412109375, -2.18438720703125, -2.071533203125, -1.95867919921875, -1.8458251953125, -1.73297119140625, -1.6201171875, -1.50726318359375, -1.3944091796875, -1.28155517578125, -1.168701171875, -1.05584716796875, -0.9429931640625, -0.83013916015625, -0.71728515625, -0.60443115234375, -0.4915771484375, -0.37872314453125, -0.265869140625, -0.15301513671875, -0.0401611328125, 0.07269287109375, 0.185546875, 0.29840087890625, 0.4112548828125, 0.52410888671875, 0.636962890625, 0.74981689453125, 0.8626708984375, 0.97552490234375, 1.08837890625, 1.20123291015625, 1.3140869140625, 1.42694091796875, 1.539794921875, 1.65264892578125, 1.7655029296875, 1.87835693359375, 1.9912109375, 2.10406494140625, 2.2169189453125, 2.32977294921875, 2.442626953125, 2.55548095703125, 2.6683349609375, 2.78118896484375, 2.89404296875, 3.00689697265625, 3.1197509765625, 3.23260498046875, 3.345458984375, 3.45831298828125, 3.5711669921875, 3.68402099609375, 3.796875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 2.0, 5.0, 10.0, 10.0, 14.0, 13.0, 13.0, 22.0, 28.0, 34.0, 38.0, 50.0, 76.0, 98.0, 156.0, 238.0, 440.0, 688.0, 679.0, 512.0, 334.0, 205.0, 99.0, 79.0, 43.0, 48.0, 29.0, 13.0, 18.0, 18.0, 7.0, 8.0, 6.0, 10.0, 6.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.845703125, -3.74237060546875, -3.6390380859375, -3.53570556640625, -3.432373046875, -3.32904052734375, -3.2257080078125, -3.12237548828125, -3.01904296875, -2.91571044921875, -2.8123779296875, -2.70904541015625, -2.605712890625, -2.50238037109375, -2.3990478515625, -2.29571533203125, -2.1923828125, -2.08905029296875, -1.9857177734375, -1.88238525390625, -1.779052734375, -1.67572021484375, -1.5723876953125, -1.46905517578125, -1.36572265625, -1.26239013671875, -1.1590576171875, -1.05572509765625, -0.952392578125, -0.84906005859375, -0.7457275390625, -0.64239501953125, -0.5390625, -0.43572998046875, -0.3323974609375, -0.22906494140625, -0.125732421875, -0.02239990234375, 0.0809326171875, 0.18426513671875, 0.28759765625, 0.39093017578125, 0.4942626953125, 0.59759521484375, 0.700927734375, 0.80426025390625, 0.9075927734375, 1.01092529296875, 1.1142578125, 1.21759033203125, 1.3209228515625, 1.42425537109375, 1.527587890625, 1.63092041015625, 1.7342529296875, 1.83758544921875, 1.94091796875, 2.04425048828125, 2.1475830078125, 2.25091552734375, 2.354248046875, 2.45758056640625, 2.5609130859375, 2.66424560546875, 2.767578125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 13.0, 24.0, 63.0, 144.0, 271.0, 290.0, 124.0, 36.0, 16.0, 10.0, 4.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.16636276245117, -48.43670654296875, -46.707054138183594, -44.97740173339844, -43.247745513916016, -41.518089294433594, -39.78843688964844, -38.05878448486328, -36.32912826538086, -34.59947204589844, -32.86981964111328, -31.140165328979492, -29.410511016845703, -27.680856704711914, -25.951202392578125, -24.221548080444336, -22.491893768310547, -20.762239456176758, -19.03258514404297, -17.30293083190918, -15.57327651977539, -13.843622207641602, -12.113967895507812, -10.384313583374023, -8.654659271240234, -6.925004959106445, -5.195350646972656, -3.465696334838867, -1.7360420227050781, -0.0063877105712890625, 1.7232666015625, 3.452920913696289, 5.1825714111328125, 6.912225723266602, 8.64188003540039, 10.37153434753418, 12.101188659667969, 13.830842971801758, 15.560497283935547, 17.290151596069336, 19.019805908203125, 20.749460220336914, 22.479114532470703, 24.208768844604492, 25.93842315673828, 27.66807746887207, 29.39773178100586, 31.12738609313965, 32.85704040527344, 34.586692810058594, 36.316349029541016, 38.04600524902344, 39.775657653808594, 41.50531005859375, 43.23496627807617, 44.964622497558594, 46.69427490234375, 48.423927307128906, 50.15358352661133, 51.88323974609375, 53.612892150878906, 55.34254455566406, 57.072200775146484, 58.801856994628906, 60.53150939941406]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 6.0, 4.0, 2.0, 18.0, 17.0, 21.0, 22.0, 28.0, 28.0, 49.0, 62.0, 75.0, 68.0, 82.0, 73.0, 59.0, 55.0, 61.0, 54.0, 46.0, 42.0, 42.0, 27.0, 26.0, 13.0, 11.0, 11.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.812461853027344, -32.86284255981445, -31.913219451904297, -30.963598251342773, -30.01397705078125, -29.06435775756836, -28.114736557006836, -27.165115356445312, -26.21549415588379, -25.265872955322266, -24.316251754760742, -23.36663055419922, -22.417011260986328, -21.467388153076172, -20.51776885986328, -19.568147659301758, -18.618526458740234, -17.66890525817871, -16.719284057617188, -15.76966381072998, -14.820042610168457, -13.870421409606934, -12.920801162719727, -11.971179962158203, -11.02155876159668, -10.071937561035156, -9.122316360473633, -8.172696113586426, -7.223074913024902, -6.273453712463379, -5.323832988739014, -4.374212265014648, -3.424591064453125, -2.4749701023101807, -1.5253491401672363, -0.575728178024292, 0.37389278411865234, 1.3235139846801758, 2.273134708404541, 3.2227554321289062, 4.17237663269043, 5.121997833251953, 6.071618556976318, 7.021239280700684, 7.970860481262207, 8.92048168182373, 9.870101928710938, 10.819723129272461, 11.769344329833984, 12.718965530395508, 13.668586730957031, 14.618206977844238, 15.567828178405762, 16.51744842529297, 17.467069625854492, 18.416690826416016, 19.36631202697754, 20.315933227539062, 21.265554428100586, 22.21517562866211, 23.164794921875, 24.114418029785156, 25.064037322998047, 26.01365852355957, 26.963279724121094]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 12.0, 11.0, 8.0, 14.0, 23.0, 37.0, 49.0, 67.0, 91.0, 142.0, 223.0, 349.0, 549.0, 869.0, 1467.0, 2492.0, 4614.0, 8096.0, 14987.0, 28100.0, 51471.0, 91328.0, 150980.0, 206687.0, 191068.0, 127798.0, 74557.0, 41465.0, 22723.0, 12233.0, 6718.0, 3826.0, 2100.0, 1266.0, 773.0, 465.0, 313.0, 189.0, 120.0, 76.0, 52.0, 48.0, 24.0, 19.0, 17.0, 8.0, 15.0, 3.0, 2.0, 1.0, 5.0, 3.0, 2.0, 0.0, 1.0], "bins": [-1.4765625, -1.43157958984375, -1.3865966796875, -1.34161376953125, -1.296630859375, -1.25164794921875, -1.2066650390625, -1.16168212890625, -1.11669921875, -1.07171630859375, -1.0267333984375, -0.98175048828125, -0.936767578125, -0.89178466796875, -0.8468017578125, -0.80181884765625, -0.7568359375, -0.71185302734375, -0.6668701171875, -0.62188720703125, -0.576904296875, -0.53192138671875, -0.4869384765625, -0.44195556640625, -0.39697265625, -0.35198974609375, -0.3070068359375, -0.26202392578125, -0.217041015625, -0.17205810546875, -0.1270751953125, -0.08209228515625, -0.037109375, 0.00787353515625, 0.0528564453125, 0.09783935546875, 0.142822265625, 0.18780517578125, 0.2327880859375, 0.27777099609375, 0.32275390625, 0.36773681640625, 0.4127197265625, 0.45770263671875, 0.502685546875, 0.54766845703125, 0.5926513671875, 0.63763427734375, 0.6826171875, 0.72760009765625, 0.7725830078125, 0.81756591796875, 0.862548828125, 0.90753173828125, 0.9525146484375, 0.99749755859375, 1.04248046875, 1.08746337890625, 1.1324462890625, 1.17742919921875, 1.222412109375, 1.26739501953125, 1.3123779296875, 1.35736083984375, 1.40234375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 4.0, 3.0, 10.0, 10.0, 9.0, 7.0, 20.0, 16.0, 15.0, 26.0, 30.0, 24.0, 27.0, 26.0, 30.0, 35.0, 44.0, 65.0, 42.0, 33.0, 41.0, 36.0, 45.0, 31.0, 43.0, 31.0, 39.0, 25.0, 25.0, 29.0, 36.0, 19.0, 24.0, 16.0, 8.0, 10.0, 14.0, 12.0, 9.0, 12.0, 5.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-1.29296875, -1.25244140625, -1.2119140625, -1.17138671875, -1.130859375, -1.09033203125, -1.0498046875, -1.00927734375, -0.96875, -0.92822265625, -0.8876953125, -0.84716796875, -0.806640625, -0.76611328125, -0.7255859375, -0.68505859375, -0.64453125, -0.60400390625, -0.5634765625, -0.52294921875, -0.482421875, -0.44189453125, -0.4013671875, -0.36083984375, -0.3203125, -0.27978515625, -0.2392578125, -0.19873046875, -0.158203125, -0.11767578125, -0.0771484375, -0.03662109375, 0.00390625, 0.04443359375, 0.0849609375, 0.12548828125, 0.166015625, 0.20654296875, 0.2470703125, 0.28759765625, 0.328125, 0.36865234375, 0.4091796875, 0.44970703125, 0.490234375, 0.53076171875, 0.5712890625, 0.61181640625, 0.65234375, 0.69287109375, 0.7333984375, 0.77392578125, 0.814453125, 0.85498046875, 0.8955078125, 0.93603515625, 0.9765625, 1.01708984375, 1.0576171875, 1.09814453125, 1.138671875, 1.17919921875, 1.2197265625, 1.26025390625, 1.30078125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 12.0, 9.0, 14.0, 17.0, 23.0, 27.0, 39.0, 57.0, 79.0, 84.0, 138.0, 209.0, 314.0, 409.0, 852.0, 1494.0, 3604.0, 13829.0, 121096.0, 738037.0, 143736.0, 16276.0, 4016.0, 1604.0, 847.0, 536.0, 353.0, 243.0, 172.0, 121.0, 103.0, 56.0, 42.0, 32.0, 19.0, 17.0, 12.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44921875, -4.298583984375, -4.14794921875, -3.997314453125, -3.8466796875, -3.696044921875, -3.54541015625, -3.394775390625, -3.244140625, -3.093505859375, -2.94287109375, -2.792236328125, -2.6416015625, -2.490966796875, -2.34033203125, -2.189697265625, -2.0390625, -1.888427734375, -1.73779296875, -1.587158203125, -1.4365234375, -1.285888671875, -1.13525390625, -0.984619140625, -0.833984375, -0.683349609375, -0.53271484375, -0.382080078125, -0.2314453125, -0.080810546875, 0.06982421875, 0.220458984375, 0.37109375, 0.521728515625, 0.67236328125, 0.822998046875, 0.9736328125, 1.124267578125, 1.27490234375, 1.425537109375, 1.576171875, 1.726806640625, 1.87744140625, 2.028076171875, 2.1787109375, 2.329345703125, 2.47998046875, 2.630615234375, 2.78125, 2.931884765625, 3.08251953125, 3.233154296875, 3.3837890625, 3.534423828125, 3.68505859375, 3.835693359375, 3.986328125, 4.136962890625, 4.28759765625, 4.438232421875, 4.5888671875, 4.739501953125, 4.89013671875, 5.040771484375, 5.19140625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 1.0, 1.0, 2.0, 3.0, 4.0, 10.0, 4.0, 7.0, 13.0, 15.0, 16.0, 16.0, 27.0, 20.0, 34.0, 32.0, 36.0, 31.0, 49.0, 38.0, 50.0, 41.0, 52.0, 45.0, 48.0, 44.0, 48.0, 45.0, 36.0, 41.0, 33.0, 27.0, 24.0, 21.0, 20.0, 21.0, 12.0, 7.0, 9.0, 9.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.53125, -5.35302734375, -5.1748046875, -4.99658203125, -4.818359375, -4.64013671875, -4.4619140625, -4.28369140625, -4.10546875, -3.92724609375, -3.7490234375, -3.57080078125, -3.392578125, -3.21435546875, -3.0361328125, -2.85791015625, -2.6796875, -2.50146484375, -2.3232421875, -2.14501953125, -1.966796875, -1.78857421875, -1.6103515625, -1.43212890625, -1.25390625, -1.07568359375, -0.8974609375, -0.71923828125, -0.541015625, -0.36279296875, -0.1845703125, -0.00634765625, 0.171875, 0.35009765625, 0.5283203125, 0.70654296875, 0.884765625, 1.06298828125, 1.2412109375, 1.41943359375, 1.59765625, 1.77587890625, 1.9541015625, 2.13232421875, 2.310546875, 2.48876953125, 2.6669921875, 2.84521484375, 3.0234375, 3.20166015625, 3.3798828125, 3.55810546875, 3.736328125, 3.91455078125, 4.0927734375, 4.27099609375, 4.44921875, 4.62744140625, 4.8056640625, 4.98388671875, 5.162109375, 5.34033203125, 5.5185546875, 5.69677734375, 5.875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 1.0, 3.0, 5.0, 2.0, 7.0, 5.0, 12.0, 26.0, 41.0, 89.0, 176.0, 522.0, 1833.0, 12576.0, 489513.0, 528381.0, 12645.0, 1786.0, 509.0, 220.0, 97.0, 37.0, 20.0, 17.0, 9.0, 5.0, 5.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.904296875, -2.821319580078125, -2.73834228515625, -2.655364990234375, -2.5723876953125, -2.489410400390625, -2.40643310546875, -2.323455810546875, -2.240478515625, -2.157501220703125, -2.07452392578125, -1.991546630859375, -1.9085693359375, -1.825592041015625, -1.74261474609375, -1.659637451171875, -1.57666015625, -1.493682861328125, -1.41070556640625, -1.327728271484375, -1.2447509765625, -1.161773681640625, -1.07879638671875, -0.995819091796875, -0.912841796875, -0.829864501953125, -0.74688720703125, -0.663909912109375, -0.5809326171875, -0.497955322265625, -0.41497802734375, -0.332000732421875, -0.2490234375, -0.166046142578125, -0.08306884765625, -9.1552734375e-05, 0.0828857421875, 0.165863037109375, 0.24884033203125, 0.331817626953125, 0.414794921875, 0.497772216796875, 0.58074951171875, 0.663726806640625, 0.7467041015625, 0.829681396484375, 0.91265869140625, 0.995635986328125, 1.07861328125, 1.161590576171875, 1.24456787109375, 1.327545166015625, 1.4105224609375, 1.493499755859375, 1.57647705078125, 1.659454345703125, 1.742431640625, 1.825408935546875, 1.90838623046875, 1.991363525390625, 2.0743408203125, 2.157318115234375, 2.24029541015625, 2.323272705078125, 2.40625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 0.0, 2.0, 4.0, 2.0, 6.0, 4.0, 9.0, 9.0, 23.0, 23.0, 33.0, 39.0, 51.0, 66.0, 70.0, 92.0, 92.0, 89.0, 81.0, 67.0, 48.0, 45.0, 38.0, 31.0, 25.0, 15.0, 8.0, 8.0, 9.0, 7.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00031948089599609375, -0.00030946359038352966, -0.0002994462847709656, -0.0002894289791584015, -0.0002794116735458374, -0.0002693943679332733, -0.00025937706232070923, -0.00024935975670814514, -0.00023934245109558105, -0.00022932514548301697, -0.00021930783987045288, -0.0002092905342578888, -0.0001992732286453247, -0.00018925592303276062, -0.00017923861742019653, -0.00016922131180763245, -0.00015920400619506836, -0.00014918670058250427, -0.00013916939496994019, -0.0001291520893573761, -0.00011913478374481201, -0.00010911747813224792, -9.910017251968384e-05, -8.908286690711975e-05, -7.906556129455566e-05, -6.904825568199158e-05, -5.903095006942749e-05, -4.90136444568634e-05, -3.8996338844299316e-05, -2.897903323173523e-05, -1.8961727619171143e-05, -8.944422006607056e-06, 1.0728836059570312e-06, 1.1090189218521118e-05, 2.1107494831085205e-05, 3.112480044364929e-05, 4.114210605621338e-05, 5.1159411668777466e-05, 6.117671728134155e-05, 7.119402289390564e-05, 8.121132850646973e-05, 9.122863411903381e-05, 0.0001012459397315979, 0.00011126324534416199, 0.00012128055095672607, 0.00013129785656929016, 0.00014131516218185425, 0.00015133246779441833, 0.00016134977340698242, 0.0001713670790195465, 0.0001813843846321106, 0.00019140169024467468, 0.00020141899585723877, 0.00021143630146980286, 0.00022145360708236694, 0.00023147091269493103, 0.00024148821830749512, 0.0002515055239200592, 0.0002615228295326233, 0.0002715401351451874, 0.00028155744075775146, 0.00029157474637031555, 0.00030159205198287964, 0.0003116093575954437, 0.0003216266632080078]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 9.0, 7.0, 8.0, 21.0, 22.0, 38.0, 63.0, 117.0, 194.0, 312.0, 623.0, 1536.0, 4885.0, 23555.0, 292734.0, 671760.0, 42005.0, 6860.0, 2055.0, 820.0, 369.0, 226.0, 131.0, 83.0, 34.0, 30.0, 20.0, 10.0, 11.0, 5.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.515625, -1.46533203125, -1.4150390625, -1.36474609375, -1.314453125, -1.26416015625, -1.2138671875, -1.16357421875, -1.11328125, -1.06298828125, -1.0126953125, -0.96240234375, -0.912109375, -0.86181640625, -0.8115234375, -0.76123046875, -0.7109375, -0.66064453125, -0.6103515625, -0.56005859375, -0.509765625, -0.45947265625, -0.4091796875, -0.35888671875, -0.30859375, -0.25830078125, -0.2080078125, -0.15771484375, -0.107421875, -0.05712890625, -0.0068359375, 0.04345703125, 0.09375, 0.14404296875, 0.1943359375, 0.24462890625, 0.294921875, 0.34521484375, 0.3955078125, 0.44580078125, 0.49609375, 0.54638671875, 0.5966796875, 0.64697265625, 0.697265625, 0.74755859375, 0.7978515625, 0.84814453125, 0.8984375, 0.94873046875, 0.9990234375, 1.04931640625, 1.099609375, 1.14990234375, 1.2001953125, 1.25048828125, 1.30078125, 1.35107421875, 1.4013671875, 1.45166015625, 1.501953125, 1.55224609375, 1.6025390625, 1.65283203125, 1.703125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 6.0, 2.0, 2.0, 7.0, 5.0, 7.0, 18.0, 18.0, 15.0, 26.0, 19.0, 37.0, 25.0, 38.0, 50.0, 83.0, 88.0, 68.0, 76.0, 75.0, 58.0, 44.0, 54.0, 39.0, 28.0, 21.0, 21.0, 16.0, 12.0, 14.0, 8.0, 2.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.3583984375, -1.3203277587890625, -1.282257080078125, -1.2441864013671875, -1.20611572265625, -1.1680450439453125, -1.129974365234375, -1.0919036865234375, -1.0538330078125, -1.0157623291015625, -0.977691650390625, -0.9396209716796875, -0.90155029296875, -0.8634796142578125, -0.825408935546875, -0.7873382568359375, -0.749267578125, -0.7111968994140625, -0.673126220703125, -0.6350555419921875, -0.59698486328125, -0.5589141845703125, -0.520843505859375, -0.4827728271484375, -0.4447021484375, -0.4066314697265625, -0.368560791015625, -0.3304901123046875, -0.29241943359375, -0.2543487548828125, -0.216278076171875, -0.1782073974609375, -0.14013671875, -0.1020660400390625, -0.063995361328125, -0.0259246826171875, 0.01214599609375, 0.0502166748046875, 0.088287353515625, 0.1263580322265625, 0.1644287109375, 0.2024993896484375, 0.240570068359375, 0.2786407470703125, 0.31671142578125, 0.3547821044921875, 0.392852783203125, 0.4309234619140625, 0.468994140625, 0.5070648193359375, 0.545135498046875, 0.5832061767578125, 0.62127685546875, 0.6593475341796875, 0.697418212890625, 0.7354888916015625, 0.7735595703125, 0.8116302490234375, 0.849700927734375, 0.8877716064453125, 0.92584228515625, 0.9639129638671875, 1.001983642578125, 1.0400543212890625, 1.078125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 18.0, 29.0, 100.0, 202.0, 322.0, 165.0, 90.0, 30.0, 10.0, 10.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.919282913208008, -25.526775360107422, -24.13426971435547, -22.741764068603516, -21.34925651550293, -19.956748962402344, -18.56424331665039, -17.171737670898438, -15.779230117797852, -14.386723518371582, -12.994216918945312, -11.601710319519043, -10.209203720092773, -8.816697120666504, -7.424190521240234, -6.031683921813965, -4.639177322387695, -3.246670722961426, -1.8541641235351562, -0.4616575241088867, 0.9308490753173828, 2.3233556747436523, 3.715862274169922, 5.108368873596191, 6.500875473022461, 7.8933820724487305, 9.285888671875, 10.67839527130127, 12.070901870727539, 13.463408470153809, 14.855915069580078, 16.24842071533203, 17.64093017578125, 19.033435821533203, 20.42594337463379, 21.818450927734375, 23.210956573486328, 24.60346221923828, 25.995969772338867, 27.388477325439453, 28.780982971191406, 30.17348861694336, 31.565996170043945, 32.95850372314453, 34.351009368896484, 35.74351501464844, 37.136024475097656, 38.52853012084961, 39.92103576660156, 41.313541412353516, 42.70604705810547, 44.09855651855469, 45.49106216430664, 46.883567810058594, 48.27607727050781, 49.668582916259766, 51.06108856201172, 52.45359420776367, 53.846099853515625, 55.238609313964844, 56.6311149597168, 58.02362060546875, 59.41613006591797, 60.80863571166992, 62.201141357421875]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 6.0, 7.0, 4.0, 12.0, 8.0, 5.0, 13.0, 19.0, 17.0, 27.0, 21.0, 25.0, 21.0, 22.0, 25.0, 32.0, 22.0, 50.0, 41.0, 62.0, 65.0, 54.0, 51.0, 57.0, 44.0, 37.0, 35.0, 31.0, 30.0, 20.0, 21.0, 15.0, 19.0, 14.0, 7.0, 9.0, 8.0, 7.0, 9.0, 6.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-21.53299331665039, -20.853647232055664, -20.174301147460938, -19.494953155517578, -18.81560707092285, -18.136260986328125, -17.4569149017334, -16.777568817138672, -16.098222732543945, -15.418876647949219, -14.739529609680176, -14.06018352508545, -13.380837440490723, -12.70149040222168, -12.022144317626953, -11.342798233032227, -10.663451194763184, -9.984105110168457, -9.304758071899414, -8.625411987304688, -7.946065902709961, -7.266719341278076, -6.587372779846191, -5.908026695251465, -5.22868013381958, -4.549333572387695, -3.8699874877929688, -3.190640926361084, -2.5112946033477783, -1.8319482803344727, -1.152601718902588, -0.47325563430786133, 0.20609092712402344, 0.8854373097419739, 1.5647836923599243, 2.2441301345825195, 2.923476457595825, 3.602822780609131, 4.282169342041016, 4.961515426635742, 5.640861988067627, 6.320208549499512, 6.999554634094238, 7.678901195526123, 8.358247756958008, 9.037593841552734, 9.716939926147461, 10.396286010742188, 11.07563304901123, 11.754979133605957, 12.434326171875, 13.113672256469727, 13.793018341064453, 14.47236442565918, 15.151711463928223, 15.83105754852295, 16.510404586791992, 17.18975067138672, 17.869096755981445, 18.548442840576172, 19.22779083251953, 19.907136917114258, 20.586483001708984, 21.26582908630371, 21.945175170898438]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 9.0, 16.0, 25.0, 32.0, 51.0, 93.0, 155.0, 245.0, 474.0, 924.0, 1830.0, 4303.0, 11295.0, 34821.0, 142238.0, 742565.0, 2137553.0, 890342.0, 165115.0, 40160.0, 12838.0, 4971.0, 2094.0, 989.0, 466.0, 275.0, 172.0, 85.0, 35.0, 31.0, 23.0, 14.0, 7.0, 8.0, 4.0, 5.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2001953125, -1.153228759765625, -1.10626220703125, -1.059295654296875, -1.0123291015625, -0.965362548828125, -0.91839599609375, -0.871429443359375, -0.824462890625, -0.777496337890625, -0.73052978515625, -0.683563232421875, -0.6365966796875, -0.589630126953125, -0.54266357421875, -0.495697021484375, -0.44873046875, -0.401763916015625, -0.35479736328125, -0.307830810546875, -0.2608642578125, -0.213897705078125, -0.16693115234375, -0.119964599609375, -0.072998046875, -0.026031494140625, 0.02093505859375, 0.067901611328125, 0.1148681640625, 0.161834716796875, 0.20880126953125, 0.255767822265625, 0.302734375, 0.349700927734375, 0.39666748046875, 0.443634033203125, 0.4906005859375, 0.537567138671875, 0.58453369140625, 0.631500244140625, 0.678466796875, 0.725433349609375, 0.77239990234375, 0.819366455078125, 0.8663330078125, 0.913299560546875, 0.96026611328125, 1.007232666015625, 1.05419921875, 1.101165771484375, 1.14813232421875, 1.195098876953125, 1.2420654296875, 1.289031982421875, 1.33599853515625, 1.382965087890625, 1.429931640625, 1.476898193359375, 1.52386474609375, 1.570831298828125, 1.6177978515625, 1.664764404296875, 1.71173095703125, 1.758697509765625, 1.8056640625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 6.0, 7.0, 6.0, 12.0, 16.0, 14.0, 26.0, 26.0, 26.0, 31.0, 28.0, 33.0, 27.0, 50.0, 44.0, 42.0, 44.0, 48.0, 44.0, 35.0, 55.0, 46.0, 43.0, 43.0, 33.0, 32.0, 29.0, 25.0, 23.0, 14.0, 12.0, 18.0, 11.0, 10.0, 15.0, 4.0, 4.0, 5.0, 3.0, 3.0, 5.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.494140625, -1.4504547119140625, -1.406768798828125, -1.3630828857421875, -1.31939697265625, -1.2757110595703125, -1.232025146484375, -1.1883392333984375, -1.1446533203125, -1.1009674072265625, -1.057281494140625, -1.0135955810546875, -0.96990966796875, -0.9262237548828125, -0.882537841796875, -0.8388519287109375, -0.795166015625, -0.7514801025390625, -0.707794189453125, -0.6641082763671875, -0.62042236328125, -0.5767364501953125, -0.533050537109375, -0.4893646240234375, -0.4456787109375, -0.4019927978515625, -0.358306884765625, -0.3146209716796875, -0.27093505859375, -0.2272491455078125, -0.183563232421875, -0.1398773193359375, -0.09619140625, -0.0525054931640625, -0.008819580078125, 0.0348663330078125, 0.07855224609375, 0.1222381591796875, 0.165924072265625, 0.2096099853515625, 0.2532958984375, 0.2969818115234375, 0.340667724609375, 0.3843536376953125, 0.42803955078125, 0.4717254638671875, 0.515411376953125, 0.5590972900390625, 0.602783203125, 0.6464691162109375, 0.690155029296875, 0.7338409423828125, 0.77752685546875, 0.8212127685546875, 0.864898681640625, 0.9085845947265625, 0.9522705078125, 0.9959564208984375, 1.039642333984375, 1.0833282470703125, 1.12701416015625, 1.1707000732421875, 1.214385986328125, 1.2580718994140625, 1.3017578125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 12.0, 14.0, 18.0, 42.0, 59.0, 100.0, 128.0, 238.0, 441.0, 1058.0, 3253.0, 15464.0, 124256.0, 3331894.0, 671204.0, 37195.0, 6235.0, 1563.0, 528.0, 234.0, 134.0, 73.0, 50.0, 37.0, 14.0, 12.0, 7.0, 7.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.203125, -4.088775634765625, -3.97442626953125, -3.860076904296875, -3.7457275390625, -3.631378173828125, -3.51702880859375, -3.402679443359375, -3.288330078125, -3.173980712890625, -3.05963134765625, -2.945281982421875, -2.8309326171875, -2.716583251953125, -2.60223388671875, -2.487884521484375, -2.37353515625, -2.259185791015625, -2.14483642578125, -2.030487060546875, -1.9161376953125, -1.801788330078125, -1.68743896484375, -1.573089599609375, -1.458740234375, -1.344390869140625, -1.23004150390625, -1.115692138671875, -1.0013427734375, -0.886993408203125, -0.77264404296875, -0.658294677734375, -0.5439453125, -0.429595947265625, -0.31524658203125, -0.200897216796875, -0.0865478515625, 0.027801513671875, 0.14215087890625, 0.256500244140625, 0.370849609375, 0.485198974609375, 0.59954833984375, 0.713897705078125, 0.8282470703125, 0.942596435546875, 1.05694580078125, 1.171295166015625, 1.28564453125, 1.399993896484375, 1.51434326171875, 1.628692626953125, 1.7430419921875, 1.857391357421875, 1.97174072265625, 2.086090087890625, 2.200439453125, 2.314788818359375, 2.42913818359375, 2.543487548828125, 2.6578369140625, 2.772186279296875, 2.88653564453125, 3.000885009765625, 3.115234375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 8.0, 6.0, 6.0, 7.0, 14.0, 13.0, 18.0, 25.0, 32.0, 49.0, 62.0, 104.0, 152.0, 235.0, 441.0, 633.0, 733.0, 595.0, 378.0, 196.0, 120.0, 82.0, 51.0, 37.0, 21.0, 20.0, 8.0, 9.0, 5.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-3.984375, -3.882843017578125, -3.78131103515625, -3.679779052734375, -3.5782470703125, -3.476715087890625, -3.37518310546875, -3.273651123046875, -3.172119140625, -3.070587158203125, -2.96905517578125, -2.867523193359375, -2.7659912109375, -2.664459228515625, -2.56292724609375, -2.461395263671875, -2.35986328125, -2.258331298828125, -2.15679931640625, -2.055267333984375, -1.9537353515625, -1.852203369140625, -1.75067138671875, -1.649139404296875, -1.547607421875, -1.446075439453125, -1.34454345703125, -1.243011474609375, -1.1414794921875, -1.039947509765625, -0.93841552734375, -0.836883544921875, -0.7353515625, -0.633819580078125, -0.53228759765625, -0.430755615234375, -0.3292236328125, -0.227691650390625, -0.12615966796875, -0.024627685546875, 0.076904296875, 0.178436279296875, 0.27996826171875, 0.381500244140625, 0.4830322265625, 0.584564208984375, 0.68609619140625, 0.787628173828125, 0.88916015625, 0.990692138671875, 1.09222412109375, 1.193756103515625, 1.2952880859375, 1.396820068359375, 1.49835205078125, 1.599884033203125, 1.701416015625, 1.802947998046875, 1.90447998046875, 2.006011962890625, 2.1075439453125, 2.209075927734375, 2.31060791015625, 2.412139892578125, 2.513671875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 8.0, 9.0, 54.0, 212.0, 377.0, 273.0, 52.0, 8.0, 9.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.86796569824219, -78.7760009765625, -76.68404388427734, -74.59207916259766, -72.50011444091797, -70.40815734863281, -68.31619262695312, -66.22422790527344, -64.13227081298828, -62.04030990600586, -59.94834518432617, -57.85638427734375, -55.76442337036133, -53.672462463378906, -51.58049774169922, -49.4885368347168, -47.39657211303711, -45.30461120605469, -43.212646484375, -41.12068557739258, -39.028724670410156, -36.93675994873047, -34.84479904174805, -32.752838134765625, -30.66087532043457, -28.568912506103516, -26.476951599121094, -24.38498878479004, -22.293025970458984, -20.201065063476562, -18.109102249145508, -16.017139434814453, -13.925178527832031, -11.833216667175293, -9.741254806518555, -7.6492919921875, -5.557330131530762, -3.4653682708740234, -1.3734054565429688, 0.7185564041137695, 2.810518264770508, 4.902480125427246, 6.994442462921143, 9.086404800415039, 11.178366661071777, 13.270328521728516, 15.36229133605957, 17.454254150390625, 19.546215057373047, 21.6381778717041, 23.730138778686523, 25.822101593017578, 27.9140625, 30.006025314331055, 32.09798812866211, 34.18994903564453, 36.28191375732422, 38.37387466430664, 40.46583938598633, 42.55780029296875, 44.64976119995117, 46.741722106933594, 48.83368682861328, 50.9256477355957, 53.017608642578125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 10.0, 8.0, 10.0, 10.0, 17.0, 14.0, 22.0, 15.0, 28.0, 32.0, 44.0, 43.0, 42.0, 47.0, 38.0, 52.0, 51.0, 49.0, 47.0, 47.0, 51.0, 48.0, 43.0, 30.0, 37.0, 30.0, 22.0, 22.0, 9.0, 14.0, 12.0, 9.0, 12.0, 6.0, 5.0, 5.0, 8.0, 4.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.680658340454102, -14.210269927978516, -13.739882469177246, -13.269495010375977, -12.79910659790039, -12.328718185424805, -11.858330726623535, -11.387943267822266, -10.91755485534668, -10.447166442871094, -9.976778984069824, -9.506391525268555, -9.036003112792969, -8.565614700317383, -8.095227241516113, -7.6248393058776855, -7.154451370239258, -6.68406343460083, -6.213675498962402, -5.743287563323975, -5.272899627685547, -4.802511692047119, -4.332123756408691, -3.8617358207702637, -3.391347885131836, -2.920959949493408, -2.4505720138549805, -1.9801840782165527, -1.509796142578125, -1.0394082069396973, -0.5690202713012695, -0.0986323356628418, 0.37175655364990234, 0.8421444892883301, 1.3125324249267578, 1.7829203605651855, 2.2533082962036133, 2.723696231842041, 3.1940841674804688, 3.6644721031188965, 4.134860038757324, 4.605247974395752, 5.07563591003418, 5.546023845672607, 6.016411781311035, 6.486799716949463, 6.957187652587891, 7.427575588226318, 7.897963523864746, 8.368350982666016, 8.838739395141602, 9.309127807617188, 9.779515266418457, 10.249902725219727, 10.720291137695312, 11.190679550170898, 11.661067008972168, 12.131454467773438, 12.601842880249023, 13.07223129272461, 13.542618751525879, 14.013006210327148, 14.483394622802734, 14.95378303527832, 15.42417049407959]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 10.0, 15.0, 22.0, 41.0, 57.0, 121.0, 216.0, 342.0, 603.0, 1138.0, 1972.0, 3689.0, 7761.0, 16836.0, 38164.0, 85422.0, 189242.0, 302493.0, 216952.0, 100545.0, 44539.0, 20098.0, 9105.0, 4216.0, 2166.0, 1217.0, 645.0, 387.0, 215.0, 130.0, 92.0, 43.0, 22.0, 19.0, 9.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.046875, -1.9840850830078125, -1.921295166015625, -1.8585052490234375, -1.79571533203125, -1.7329254150390625, -1.670135498046875, -1.6073455810546875, -1.5445556640625, -1.4817657470703125, -1.418975830078125, -1.3561859130859375, -1.29339599609375, -1.2306060791015625, -1.167816162109375, -1.1050262451171875, -1.042236328125, -0.9794464111328125, -0.916656494140625, -0.8538665771484375, -0.79107666015625, -0.7282867431640625, -0.665496826171875, -0.6027069091796875, -0.5399169921875, -0.4771270751953125, -0.414337158203125, -0.3515472412109375, -0.28875732421875, -0.2259674072265625, -0.163177490234375, -0.1003875732421875, -0.03759765625, 0.0251922607421875, 0.087982177734375, 0.1507720947265625, 0.21356201171875, 0.2763519287109375, 0.339141845703125, 0.4019317626953125, 0.4647216796875, 0.5275115966796875, 0.590301513671875, 0.6530914306640625, 0.71588134765625, 0.7786712646484375, 0.841461181640625, 0.9042510986328125, 0.967041015625, 1.0298309326171875, 1.092620849609375, 1.1554107666015625, 1.21820068359375, 1.2809906005859375, 1.343780517578125, 1.4065704345703125, 1.4693603515625, 1.5321502685546875, 1.594940185546875, 1.6577301025390625, 1.72052001953125, 1.7833099365234375, 1.846099853515625, 1.9088897705078125, 1.9716796875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 10.0, 5.0, 10.0, 20.0, 21.0, 22.0, 26.0, 21.0, 34.0, 35.0, 28.0, 42.0, 40.0, 33.0, 37.0, 42.0, 45.0, 44.0, 42.0, 45.0, 45.0, 42.0, 33.0, 26.0, 33.0, 29.0, 25.0, 25.0, 21.0, 16.0, 14.0, 18.0, 18.0, 8.0, 4.0, 7.0, 8.0, 10.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.26953125, -1.229156494140625, -1.18878173828125, -1.148406982421875, -1.1080322265625, -1.067657470703125, -1.02728271484375, -0.986907958984375, -0.946533203125, -0.906158447265625, -0.86578369140625, -0.825408935546875, -0.7850341796875, -0.744659423828125, -0.70428466796875, -0.663909912109375, -0.62353515625, -0.583160400390625, -0.54278564453125, -0.502410888671875, -0.4620361328125, -0.421661376953125, -0.38128662109375, -0.340911865234375, -0.300537109375, -0.260162353515625, -0.21978759765625, -0.179412841796875, -0.1390380859375, -0.098663330078125, -0.05828857421875, -0.017913818359375, 0.0224609375, 0.062835693359375, 0.10321044921875, 0.143585205078125, 0.1839599609375, 0.224334716796875, 0.26470947265625, 0.305084228515625, 0.345458984375, 0.385833740234375, 0.42620849609375, 0.466583251953125, 0.5069580078125, 0.547332763671875, 0.58770751953125, 0.628082275390625, 0.66845703125, 0.708831787109375, 0.74920654296875, 0.789581298828125, 0.8299560546875, 0.870330810546875, 0.91070556640625, 0.951080322265625, 0.991455078125, 1.031829833984375, 1.07220458984375, 1.112579345703125, 1.1529541015625, 1.193328857421875, 1.23370361328125, 1.274078369140625, 1.314453125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 9.0, 12.0, 17.0, 12.0, 33.0, 22.0, 66.0, 71.0, 113.0, 140.0, 206.0, 353.0, 576.0, 994.0, 2151.0, 6231.0, 36703.0, 367383.0, 576720.0, 44234.0, 7282.0, 2286.0, 1106.0, 617.0, 382.0, 252.0, 177.0, 106.0, 86.0, 65.0, 46.0, 31.0, 18.0, 16.0, 14.0, 6.0, 9.0, 6.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.8359375, -4.67498779296875, -4.5140380859375, -4.35308837890625, -4.192138671875, -4.03118896484375, -3.8702392578125, -3.70928955078125, -3.54833984375, -3.38739013671875, -3.2264404296875, -3.06549072265625, -2.904541015625, -2.74359130859375, -2.5826416015625, -2.42169189453125, -2.2607421875, -2.09979248046875, -1.9388427734375, -1.77789306640625, -1.616943359375, -1.45599365234375, -1.2950439453125, -1.13409423828125, -0.97314453125, -0.81219482421875, -0.6512451171875, -0.49029541015625, -0.329345703125, -0.16839599609375, -0.0074462890625, 0.15350341796875, 0.314453125, 0.47540283203125, 0.6363525390625, 0.79730224609375, 0.958251953125, 1.11920166015625, 1.2801513671875, 1.44110107421875, 1.60205078125, 1.76300048828125, 1.9239501953125, 2.08489990234375, 2.245849609375, 2.40679931640625, 2.5677490234375, 2.72869873046875, 2.8896484375, 3.05059814453125, 3.2115478515625, 3.37249755859375, 3.533447265625, 3.69439697265625, 3.8553466796875, 4.01629638671875, 4.17724609375, 4.33819580078125, 4.4991455078125, 4.66009521484375, 4.821044921875, 4.98199462890625, 5.1429443359375, 5.30389404296875, 5.46484375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 12.0, 6.0, 3.0, 5.0, 11.0, 10.0, 12.0, 16.0, 17.0, 21.0, 28.0, 29.0, 37.0, 39.0, 50.0, 47.0, 53.0, 60.0, 52.0, 50.0, 52.0, 46.0, 39.0, 53.0, 35.0, 36.0, 31.0, 33.0, 23.0, 24.0, 10.0, 14.0, 14.0, 8.0, 7.0, 5.0, 5.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.15234375, -5.97381591796875, -5.7952880859375, -5.61676025390625, -5.438232421875, -5.25970458984375, -5.0811767578125, -4.90264892578125, -4.72412109375, -4.54559326171875, -4.3670654296875, -4.18853759765625, -4.010009765625, -3.83148193359375, -3.6529541015625, -3.47442626953125, -3.2958984375, -3.11737060546875, -2.9388427734375, -2.76031494140625, -2.581787109375, -2.40325927734375, -2.2247314453125, -2.04620361328125, -1.86767578125, -1.68914794921875, -1.5106201171875, -1.33209228515625, -1.153564453125, -0.97503662109375, -0.7965087890625, -0.61798095703125, -0.439453125, -0.26092529296875, -0.0823974609375, 0.09613037109375, 0.274658203125, 0.45318603515625, 0.6317138671875, 0.81024169921875, 0.98876953125, 1.16729736328125, 1.3458251953125, 1.52435302734375, 1.702880859375, 1.88140869140625, 2.0599365234375, 2.23846435546875, 2.4169921875, 2.59552001953125, 2.7740478515625, 2.95257568359375, 3.131103515625, 3.30963134765625, 3.4881591796875, 3.66668701171875, 3.84521484375, 4.02374267578125, 4.2022705078125, 4.38079833984375, 4.559326171875, 4.73785400390625, 4.9163818359375, 5.09490966796875, 5.2734375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 5.0, 6.0, 8.0, 13.0, 11.0, 19.0, 25.0, 54.0, 108.0, 214.0, 318.0, 769.0, 1749.0, 4539.0, 14818.0, 79739.0, 648344.0, 247800.0, 36237.0, 8560.0, 2945.0, 1161.0, 534.0, 253.0, 133.0, 76.0, 37.0, 22.0, 21.0, 18.0, 7.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.240234375, -1.1971435546875, -1.154052734375, -1.1109619140625, -1.06787109375, -1.0247802734375, -0.981689453125, -0.9385986328125, -0.8955078125, -0.8524169921875, -0.809326171875, -0.7662353515625, -0.72314453125, -0.6800537109375, -0.636962890625, -0.5938720703125, -0.55078125, -0.5076904296875, -0.464599609375, -0.4215087890625, -0.37841796875, -0.3353271484375, -0.292236328125, -0.2491455078125, -0.2060546875, -0.1629638671875, -0.119873046875, -0.0767822265625, -0.03369140625, 0.0093994140625, 0.052490234375, 0.0955810546875, 0.138671875, 0.1817626953125, 0.224853515625, 0.2679443359375, 0.31103515625, 0.3541259765625, 0.397216796875, 0.4403076171875, 0.4833984375, 0.5264892578125, 0.569580078125, 0.6126708984375, 0.65576171875, 0.6988525390625, 0.741943359375, 0.7850341796875, 0.828125, 0.8712158203125, 0.914306640625, 0.9573974609375, 1.00048828125, 1.0435791015625, 1.086669921875, 1.1297607421875, 1.1728515625, 1.2159423828125, 1.259033203125, 1.3021240234375, 1.34521484375, 1.3883056640625, 1.431396484375, 1.4744873046875, 1.517578125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 3.0, 1.0, 3.0, 6.0, 2.0, 9.0, 10.0, 24.0, 31.0, 49.0, 57.0, 89.0, 122.0, 124.0, 134.0, 93.0, 70.0, 48.0, 37.0, 22.0, 16.0, 23.0, 5.0, 10.0, 2.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003993511199951172, -0.0003844834864139557, -0.0003696158528327942, -0.0003547482192516327, -0.0003398805856704712, -0.0003250129520893097, -0.0003101453185081482, -0.0002952776849269867, -0.0002804100513458252, -0.0002655424177646637, -0.0002506747841835022, -0.0002358071506023407, -0.0002209395170211792, -0.0002060718834400177, -0.0001912042498588562, -0.0001763366162776947, -0.0001614689826965332, -0.0001466013491153717, -0.0001317337155342102, -0.0001168660819530487, -0.00010199844837188721, -8.713081479072571e-05, -7.226318120956421e-05, -5.739554762840271e-05, -4.252791404724121e-05, -2.7660280466079712e-05, -1.2792646884918213e-05, 2.074986696243286e-06, 1.6942620277404785e-05, 3.1810253858566284e-05, 4.667788743972778e-05, 6.154552102088928e-05, 7.641315460205078e-05, 9.128078818321228e-05, 0.00010614842176437378, 0.00012101605534553528, 0.00013588368892669678, 0.00015075132250785828, 0.00016561895608901978, 0.00018048658967018127, 0.00019535422325134277, 0.00021022185683250427, 0.00022508949041366577, 0.00023995712399482727, 0.00025482475757598877, 0.00026969239115715027, 0.00028456002473831177, 0.00029942765831947327, 0.00031429529190063477, 0.00032916292548179626, 0.00034403055906295776, 0.00035889819264411926, 0.00037376582622528076, 0.00038863345980644226, 0.00040350109338760376, 0.00041836872696876526, 0.00043323636054992676, 0.00044810399413108826, 0.00046297162771224976, 0.00047783926129341125, 0.0004927068948745728, 0.0005075745284557343, 0.0005224421620368958, 0.0005373097956180573, 0.0005521774291992188]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 9.0, 9.0, 17.0, 16.0, 25.0, 33.0, 55.0, 59.0, 113.0, 166.0, 238.0, 398.0, 778.0, 1469.0, 3538.0, 9589.0, 36576.0, 204606.0, 640633.0, 115516.0, 22579.0, 6733.0, 2589.0, 1184.0, 595.0, 351.0, 227.0, 136.0, 86.0, 60.0, 38.0, 33.0, 29.0, 22.0, 11.0, 6.0, 4.0, 1.0, 3.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0], "bins": [-1.189453125, -1.154815673828125, -1.12017822265625, -1.085540771484375, -1.0509033203125, -1.016265869140625, -0.98162841796875, -0.946990966796875, -0.912353515625, -0.877716064453125, -0.84307861328125, -0.808441162109375, -0.7738037109375, -0.739166259765625, -0.70452880859375, -0.669891357421875, -0.63525390625, -0.600616455078125, -0.56597900390625, -0.531341552734375, -0.4967041015625, -0.462066650390625, -0.42742919921875, -0.392791748046875, -0.358154296875, -0.323516845703125, -0.28887939453125, -0.254241943359375, -0.2196044921875, -0.184967041015625, -0.15032958984375, -0.115692138671875, -0.0810546875, -0.046417236328125, -0.01177978515625, 0.022857666015625, 0.0574951171875, 0.092132568359375, 0.12677001953125, 0.161407470703125, 0.196044921875, 0.230682373046875, 0.26531982421875, 0.299957275390625, 0.3345947265625, 0.369232177734375, 0.40386962890625, 0.438507080078125, 0.47314453125, 0.507781982421875, 0.54241943359375, 0.577056884765625, 0.6116943359375, 0.646331787109375, 0.68096923828125, 0.715606689453125, 0.750244140625, 0.784881591796875, 0.81951904296875, 0.854156494140625, 0.8887939453125, 0.923431396484375, 0.95806884765625, 0.992706298828125, 1.02734375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 6.0, 4.0, 6.0, 10.0, 5.0, 10.0, 11.0, 7.0, 13.0, 16.0, 32.0, 37.0, 47.0, 33.0, 60.0, 76.0, 88.0, 81.0, 86.0, 69.0, 67.0, 54.0, 39.0, 27.0, 23.0, 16.0, 14.0, 10.0, 13.0, 8.0, 8.0, 4.0, 5.0, 3.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.98876953125, -0.9530105590820312, -0.9172515869140625, -0.8814926147460938, -0.845733642578125, -0.8099746704101562, -0.7742156982421875, -0.7384567260742188, -0.70269775390625, -0.6669387817382812, -0.6311798095703125, -0.5954208374023438, -0.559661865234375, -0.5239028930664062, -0.4881439208984375, -0.45238494873046875, -0.4166259765625, -0.38086700439453125, -0.3451080322265625, -0.30934906005859375, -0.273590087890625, -0.23783111572265625, -0.2020721435546875, -0.16631317138671875, -0.13055419921875, -0.09479522705078125, -0.0590362548828125, -0.02327728271484375, 0.012481689453125, 0.04824066162109375, 0.0839996337890625, 0.11975860595703125, 0.155517578125, 0.19127655029296875, 0.2270355224609375, 0.26279449462890625, 0.298553466796875, 0.33431243896484375, 0.3700714111328125, 0.40583038330078125, 0.44158935546875, 0.47734832763671875, 0.5131072998046875, 0.5488662719726562, 0.584625244140625, 0.6203842163085938, 0.6561431884765625, 0.6919021606445312, 0.7276611328125, 0.7634201049804688, 0.7991790771484375, 0.8349380493164062, 0.870697021484375, 0.9064559936523438, 0.9422149658203125, 0.9779739379882812, 1.01373291015625, 1.0494918823242188, 1.0852508544921875, 1.1210098266601562, 1.156768798828125, 1.1925277709960938, 1.2282867431640625, 1.2640457153320312, 1.2998046875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 1.0, 10.0, 17.0, 30.0, 66.0, 113.0, 184.0, 259.0, 133.0, 90.0, 44.0, 20.0, 10.0, 10.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.882457733154297, -28.825586318969727, -27.768714904785156, -26.71184539794922, -25.65497398376465, -24.598102569580078, -23.54123306274414, -22.48436164855957, -21.427490234375, -20.37061882019043, -19.31374740600586, -18.256877899169922, -17.20000648498535, -16.14313507080078, -15.086264610290527, -14.029394149780273, -12.972522735595703, -11.915651321411133, -10.858780860900879, -9.801910400390625, -8.745038986206055, -7.688168048858643, -6.6312971115112305, -5.574426174163818, -4.517555236816406, -3.460684299468994, -2.403813362121582, -1.34694242477417, -0.2900714874267578, 0.7667994499206543, 1.8236703872680664, 2.8805413246154785, 3.9374122619628906, 4.994283199310303, 6.051154136657715, 7.108025074005127, 8.164896011352539, 9.22176742553711, 10.278637886047363, 11.335508346557617, 12.392379760742188, 13.449251174926758, 14.506121635437012, 15.562992095947266, 16.619863510131836, 17.676734924316406, 18.733604431152344, 19.790475845336914, 20.847347259521484, 21.904218673706055, 22.961090087890625, 24.017959594726562, 25.074831008911133, 26.131702423095703, 27.18857192993164, 28.24544334411621, 29.30231475830078, 30.35918617248535, 31.416057586669922, 32.47292709350586, 33.52980041503906, 34.586669921875, 35.64353942871094, 36.70041275024414, 37.75728225708008]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 8.0, 6.0, 7.0, 14.0, 11.0, 12.0, 16.0, 18.0, 12.0, 23.0, 31.0, 41.0, 30.0, 34.0, 26.0, 42.0, 54.0, 59.0, 92.0, 76.0, 47.0, 51.0, 41.0, 41.0, 41.0, 28.0, 22.0, 25.0, 12.0, 15.0, 15.0, 11.0, 11.0, 10.0, 7.0, 5.0, 7.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.954669952392578, -23.2232666015625, -22.491863250732422, -21.760459899902344, -21.029054641723633, -20.297651290893555, -19.566247940063477, -18.8348445892334, -18.10344123840332, -17.372037887573242, -16.640634536743164, -15.90923023223877, -15.177826881408691, -14.446422576904297, -13.715019226074219, -12.98361587524414, -12.252211570739746, -11.520808219909668, -10.789403915405273, -10.058000564575195, -9.326597213745117, -8.595193862915039, -7.8637895584106445, -7.132386207580566, -6.40098237991333, -5.669578552246094, -4.938175201416016, -4.206771373748779, -3.475367784500122, -2.743964195251465, -2.0125603675842285, -1.2811570167541504, -0.5497531890869141, 0.18165045976638794, 0.9130541086196899, 1.6444578170776367, 2.375861406326294, 3.107264995574951, 3.8386688232421875, 4.570072174072266, 5.301476001739502, 6.032879829406738, 6.764283180236816, 7.495687007904053, 8.227090835571289, 8.958494186401367, 9.689897537231445, 10.421300888061523, 11.152705192565918, 11.884108543395996, 12.61551284790039, 13.346916198730469, 14.078319549560547, 14.809722900390625, 15.54112720489502, 16.27252960205078, 17.003934860229492, 17.73533821105957, 18.46674156188965, 19.19814682006836, 19.929550170898438, 20.660953521728516, 21.392356872558594, 22.123760223388672, 22.85516357421875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 9.0, 6.0, 8.0, 8.0, 14.0, 24.0, 29.0, 31.0, 55.0, 54.0, 96.0, 114.0, 193.0, 386.0, 794.0, 1994.0, 6025.0, 27012.0, 228568.0, 2082903.0, 1661217.0, 155994.0, 20303.0, 4993.0, 1727.0, 748.0, 335.0, 183.0, 122.0, 78.0, 64.0, 49.0, 44.0, 29.0, 21.0, 16.0, 6.0, 9.0, 3.0, 9.0, 0.0, 1.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.7734375, -1.712127685546875, -1.65081787109375, -1.589508056640625, -1.5281982421875, -1.466888427734375, -1.40557861328125, -1.344268798828125, -1.282958984375, -1.221649169921875, -1.16033935546875, -1.099029541015625, -1.0377197265625, -0.976409912109375, -0.91510009765625, -0.853790283203125, -0.79248046875, -0.731170654296875, -0.66986083984375, -0.608551025390625, -0.5472412109375, -0.485931396484375, -0.42462158203125, -0.363311767578125, -0.302001953125, -0.240692138671875, -0.17938232421875, -0.118072509765625, -0.0567626953125, 0.004547119140625, 0.06585693359375, 0.127166748046875, 0.1884765625, 0.249786376953125, 0.31109619140625, 0.372406005859375, 0.4337158203125, 0.495025634765625, 0.55633544921875, 0.617645263671875, 0.678955078125, 0.740264892578125, 0.80157470703125, 0.862884521484375, 0.9241943359375, 0.985504150390625, 1.04681396484375, 1.108123779296875, 1.16943359375, 1.230743408203125, 1.29205322265625, 1.353363037109375, 1.4146728515625, 1.475982666015625, 1.53729248046875, 1.598602294921875, 1.659912109375, 1.721221923828125, 1.78253173828125, 1.843841552734375, 1.9051513671875, 1.966461181640625, 2.02777099609375, 2.089080810546875, 2.150390625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 11.0, 8.0, 11.0, 11.0, 18.0, 13.0, 24.0, 20.0, 18.0, 31.0, 24.0, 36.0, 43.0, 37.0, 35.0, 40.0, 32.0, 40.0, 49.0, 47.0, 39.0, 59.0, 37.0, 45.0, 42.0, 29.0, 33.0, 29.0, 13.0, 22.0, 11.0, 18.0, 15.0, 12.0, 12.0, 8.0, 8.0, 3.0, 5.0, 2.0, 2.0, 2.0, 4.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.2353515625, -1.198638916015625, -1.16192626953125, -1.125213623046875, -1.0885009765625, -1.051788330078125, -1.01507568359375, -0.978363037109375, -0.941650390625, -0.904937744140625, -0.86822509765625, -0.831512451171875, -0.7947998046875, -0.758087158203125, -0.72137451171875, -0.684661865234375, -0.64794921875, -0.611236572265625, -0.57452392578125, -0.537811279296875, -0.5010986328125, -0.464385986328125, -0.42767333984375, -0.390960693359375, -0.354248046875, -0.317535400390625, -0.28082275390625, -0.244110107421875, -0.2073974609375, -0.170684814453125, -0.13397216796875, -0.097259521484375, -0.060546875, -0.023834228515625, 0.01287841796875, 0.049591064453125, 0.0863037109375, 0.123016357421875, 0.15972900390625, 0.196441650390625, 0.233154296875, 0.269866943359375, 0.30657958984375, 0.343292236328125, 0.3800048828125, 0.416717529296875, 0.45343017578125, 0.490142822265625, 0.52685546875, 0.563568115234375, 0.60028076171875, 0.636993408203125, 0.6737060546875, 0.710418701171875, 0.74713134765625, 0.783843994140625, 0.820556640625, 0.857269287109375, 0.89398193359375, 0.930694580078125, 0.9674072265625, 1.004119873046875, 1.04083251953125, 1.077545166015625, 1.1142578125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 19.0, 26.0, 34.0, 91.0, 150.0, 310.0, 888.0, 8273.0, 3406791.0, 772252.0, 4405.0, 630.0, 216.0, 100.0, 51.0, 22.0, 9.0, 11.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7734375, -8.51470947265625, -8.2559814453125, -7.99725341796875, -7.738525390625, -7.47979736328125, -7.2210693359375, -6.96234130859375, -6.70361328125, -6.44488525390625, -6.1861572265625, -5.92742919921875, -5.668701171875, -5.40997314453125, -5.1512451171875, -4.89251708984375, -4.6337890625, -4.37506103515625, -4.1163330078125, -3.85760498046875, -3.598876953125, -3.34014892578125, -3.0814208984375, -2.82269287109375, -2.56396484375, -2.30523681640625, -2.0465087890625, -1.78778076171875, -1.529052734375, -1.27032470703125, -1.0115966796875, -0.75286865234375, -0.494140625, -0.23541259765625, 0.0233154296875, 0.28204345703125, 0.540771484375, 0.79949951171875, 1.0582275390625, 1.31695556640625, 1.57568359375, 1.83441162109375, 2.0931396484375, 2.35186767578125, 2.610595703125, 2.86932373046875, 3.1280517578125, 3.38677978515625, 3.6455078125, 3.90423583984375, 4.1629638671875, 4.42169189453125, 4.680419921875, 4.93914794921875, 5.1978759765625, 5.45660400390625, 5.71533203125, 5.97406005859375, 6.2327880859375, 6.49151611328125, 6.750244140625, 7.00897216796875, 7.2677001953125, 7.52642822265625, 7.78515625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 9.0, 14.0, 22.0, 31.0, 43.0, 67.0, 154.0, 346.0, 691.0, 1127.0, 865.0, 361.0, 168.0, 79.0, 36.0, 28.0, 14.0, 8.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.55078125, -6.409912109375, -6.26904296875, -6.128173828125, -5.9873046875, -5.846435546875, -5.70556640625, -5.564697265625, -5.423828125, -5.282958984375, -5.14208984375, -5.001220703125, -4.8603515625, -4.719482421875, -4.57861328125, -4.437744140625, -4.296875, -4.156005859375, -4.01513671875, -3.874267578125, -3.7333984375, -3.592529296875, -3.45166015625, -3.310791015625, -3.169921875, -3.029052734375, -2.88818359375, -2.747314453125, -2.6064453125, -2.465576171875, -2.32470703125, -2.183837890625, -2.04296875, -1.902099609375, -1.76123046875, -1.620361328125, -1.4794921875, -1.338623046875, -1.19775390625, -1.056884765625, -0.916015625, -0.775146484375, -0.63427734375, -0.493408203125, -0.3525390625, -0.211669921875, -0.07080078125, 0.070068359375, 0.2109375, 0.351806640625, 0.49267578125, 0.633544921875, 0.7744140625, 0.915283203125, 1.05615234375, 1.197021484375, 1.337890625, 1.478759765625, 1.61962890625, 1.760498046875, 1.9013671875, 2.042236328125, 2.18310546875, 2.323974609375, 2.46484375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 17.0, 29.0, 122.0, 352.0, 333.0, 108.0, 14.0, 10.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.719482421875, -86.83426666259766, -84.94905853271484, -83.0638427734375, -81.17863464355469, -79.29341888427734, -77.40821075439453, -75.52299499511719, -73.63778686523438, -71.75257110595703, -69.86736297607422, -67.98214721679688, -66.09693908691406, -64.21172332763672, -62.32651138305664, -60.44129943847656, -58.55608367919922, -56.67087173461914, -54.78565979003906, -52.900447845458984, -51.015235900878906, -49.13002014160156, -47.244808197021484, -45.359596252441406, -43.47438430786133, -41.58917236328125, -39.70396041870117, -37.818748474121094, -35.93353271484375, -34.04832458496094, -32.163108825683594, -30.277896881103516, -28.392684936523438, -26.50747299194336, -24.62226104736328, -22.73704719543457, -20.851835250854492, -18.966623306274414, -17.081409454345703, -15.196197509765625, -13.310985565185547, -11.425773620605469, -9.540560722351074, -7.655348300933838, -5.770135879516602, -3.8849239349365234, -1.999711036682129, -0.11449813842773438, 1.7707138061523438, 3.65592622756958, 5.541138648986816, 7.426351070404053, 9.311563491821289, 11.196775436401367, 13.081988334655762, 14.967201232910156, 16.852413177490234, 18.737625122070312, 20.62283706665039, 22.5080509185791, 24.39326286315918, 26.278474807739258, 28.16368865966797, 30.048900604248047, 31.934112548828125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 6.0, 4.0, 5.0, 8.0, 6.0, 9.0, 18.0, 8.0, 17.0, 21.0, 20.0, 27.0, 23.0, 36.0, 34.0, 38.0, 41.0, 51.0, 41.0, 36.0, 52.0, 63.0, 44.0, 66.0, 38.0, 40.0, 46.0, 47.0, 31.0, 27.0, 23.0, 14.0, 12.0, 16.0, 10.0, 9.0, 5.0, 6.0, 2.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.791007041931152, -12.32728385925293, -11.86355972290039, -11.399836540222168, -10.936113357543945, -10.472389221191406, -10.008666038513184, -9.544942855834961, -9.081218719482422, -8.6174955368042, -8.15377140045166, -7.6900482177734375, -7.226325035095215, -6.762601375579834, -6.298877716064453, -5.8351545333862305, -5.371431350708008, -4.907707691192627, -4.443984508514404, -3.9802608489990234, -3.5165374279022217, -3.05281400680542, -2.589090347290039, -2.1253669261932373, -1.6616435050964355, -1.1979200839996338, -0.7341965436935425, -0.27047300338745117, 0.19325041770935059, 0.6569738388061523, 1.1206974983215332, 1.584420919418335, 2.048145294189453, 2.511868715286255, 2.9755921363830566, 3.4393157958984375, 3.9030392169952393, 4.366762638092041, 4.830486297607422, 5.2942094802856445, 5.757933139801025, 6.221656799316406, 6.685379981994629, 7.14910364151001, 7.612827301025391, 8.076550483703613, 8.540273666381836, 9.003997802734375, 9.467720985412598, 9.93144416809082, 10.39516830444336, 10.858891487121582, 11.322614669799805, 11.786338806152344, 12.250061988830566, 12.713785171508789, 13.177509307861328, 13.64123249053955, 14.10495662689209, 14.568679809570312, 15.032402992248535, 15.496126174926758, 15.959850311279297, 16.423574447631836, 16.887296676635742]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 11.0, 15.0, 28.0, 50.0, 47.0, 97.0, 148.0, 208.0, 335.0, 545.0, 890.0, 1445.0, 2418.0, 4055.0, 7397.0, 13250.0, 24377.0, 45501.0, 84066.0, 143970.0, 201899.0, 199002.0, 140314.0, 81858.0, 43887.0, 23179.0, 12673.0, 6993.0, 4034.0, 2305.0, 1348.0, 798.0, 499.0, 330.0, 184.0, 139.0, 92.0, 63.0, 37.0, 22.0, 20.0, 14.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1953125, -1.155426025390625, -1.11553955078125, -1.075653076171875, -1.0357666015625, -0.995880126953125, -0.95599365234375, -0.916107177734375, -0.876220703125, -0.836334228515625, -0.79644775390625, -0.756561279296875, -0.7166748046875, -0.676788330078125, -0.63690185546875, -0.597015380859375, -0.55712890625, -0.517242431640625, -0.47735595703125, -0.437469482421875, -0.3975830078125, -0.357696533203125, -0.31781005859375, -0.277923583984375, -0.238037109375, -0.198150634765625, -0.15826416015625, -0.118377685546875, -0.0784912109375, -0.038604736328125, 0.00128173828125, 0.041168212890625, 0.0810546875, 0.120941162109375, 0.16082763671875, 0.200714111328125, 0.2406005859375, 0.280487060546875, 0.32037353515625, 0.360260009765625, 0.400146484375, 0.440032958984375, 0.47991943359375, 0.519805908203125, 0.5596923828125, 0.599578857421875, 0.63946533203125, 0.679351806640625, 0.71923828125, 0.759124755859375, 0.79901123046875, 0.838897705078125, 0.8787841796875, 0.918670654296875, 0.95855712890625, 0.998443603515625, 1.038330078125, 1.078216552734375, 1.11810302734375, 1.157989501953125, 1.1978759765625, 1.237762451171875, 1.27764892578125, 1.317535400390625, 1.357421875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 5.0, 14.0, 15.0, 18.0, 14.0, 14.0, 17.0, 28.0, 23.0, 30.0, 30.0, 31.0, 28.0, 31.0, 31.0, 39.0, 40.0, 33.0, 40.0, 47.0, 44.0, 37.0, 51.0, 37.0, 30.0, 28.0, 30.0, 32.0, 30.0, 17.0, 30.0, 18.0, 9.0, 10.0, 13.0, 9.0, 9.0, 7.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0703125, -1.0332794189453125, -0.996246337890625, -0.9592132568359375, -0.92218017578125, -0.8851470947265625, -0.848114013671875, -0.8110809326171875, -0.7740478515625, -0.7370147705078125, -0.699981689453125, -0.6629486083984375, -0.62591552734375, -0.5888824462890625, -0.551849365234375, -0.5148162841796875, -0.477783203125, -0.4407501220703125, -0.403717041015625, -0.3666839599609375, -0.32965087890625, -0.2926177978515625, -0.255584716796875, -0.2185516357421875, -0.1815185546875, -0.1444854736328125, -0.107452392578125, -0.0704193115234375, -0.03338623046875, 0.0036468505859375, 0.040679931640625, 0.0777130126953125, 0.11474609375, 0.1517791748046875, 0.188812255859375, 0.2258453369140625, 0.26287841796875, 0.2999114990234375, 0.336944580078125, 0.3739776611328125, 0.4110107421875, 0.4480438232421875, 0.485076904296875, 0.5221099853515625, 0.55914306640625, 0.5961761474609375, 0.633209228515625, 0.6702423095703125, 0.707275390625, 0.7443084716796875, 0.781341552734375, 0.8183746337890625, 0.85540771484375, 0.8924407958984375, 0.929473876953125, 0.9665069580078125, 1.0035400390625, 1.0405731201171875, 1.077606201171875, 1.1146392822265625, 1.15167236328125, 1.1887054443359375, 1.225738525390625, 1.2627716064453125, 1.2998046875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 6.0, 8.0, 18.0, 21.0, 28.0, 35.0, 62.0, 87.0, 155.0, 222.0, 487.0, 1327.0, 4667.0, 23770.0, 189205.0, 702398.0, 106204.0, 14696.0, 3210.0, 955.0, 411.0, 216.0, 108.0, 79.0, 49.0, 38.0, 25.0, 9.0, 14.0, 7.0, 10.0, 9.0, 5.0, 2.0, 2.0, 0.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.796875, -4.65728759765625, -4.5177001953125, -4.37811279296875, -4.238525390625, -4.09893798828125, -3.9593505859375, -3.81976318359375, -3.68017578125, -3.54058837890625, -3.4010009765625, -3.26141357421875, -3.121826171875, -2.98223876953125, -2.8426513671875, -2.70306396484375, -2.5634765625, -2.42388916015625, -2.2843017578125, -2.14471435546875, -2.005126953125, -1.86553955078125, -1.7259521484375, -1.58636474609375, -1.44677734375, -1.30718994140625, -1.1676025390625, -1.02801513671875, -0.888427734375, -0.74884033203125, -0.6092529296875, -0.46966552734375, -0.330078125, -0.19049072265625, -0.0509033203125, 0.08868408203125, 0.228271484375, 0.36785888671875, 0.5074462890625, 0.64703369140625, 0.78662109375, 0.92620849609375, 1.0657958984375, 1.20538330078125, 1.344970703125, 1.48455810546875, 1.6241455078125, 1.76373291015625, 1.9033203125, 2.04290771484375, 2.1824951171875, 2.32208251953125, 2.461669921875, 2.60125732421875, 2.7408447265625, 2.88043212890625, 3.02001953125, 3.15960693359375, 3.2991943359375, 3.43878173828125, 3.578369140625, 3.71795654296875, 3.8575439453125, 3.99713134765625, 4.13671875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 1.0, 4.0, 5.0, 3.0, 4.0, 6.0, 6.0, 7.0, 10.0, 17.0, 13.0, 19.0, 19.0, 19.0, 32.0, 41.0, 33.0, 40.0, 43.0, 36.0, 40.0, 46.0, 59.0, 46.0, 54.0, 49.0, 51.0, 46.0, 33.0, 33.0, 37.0, 25.0, 21.0, 18.0, 10.0, 15.0, 11.0, 9.0, 14.0, 8.0, 6.0, 7.0, 2.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.75, -4.59423828125, -4.4384765625, -4.28271484375, -4.126953125, -3.97119140625, -3.8154296875, -3.65966796875, -3.50390625, -3.34814453125, -3.1923828125, -3.03662109375, -2.880859375, -2.72509765625, -2.5693359375, -2.41357421875, -2.2578125, -2.10205078125, -1.9462890625, -1.79052734375, -1.634765625, -1.47900390625, -1.3232421875, -1.16748046875, -1.01171875, -0.85595703125, -0.7001953125, -0.54443359375, -0.388671875, -0.23291015625, -0.0771484375, 0.07861328125, 0.234375, 0.39013671875, 0.5458984375, 0.70166015625, 0.857421875, 1.01318359375, 1.1689453125, 1.32470703125, 1.48046875, 1.63623046875, 1.7919921875, 1.94775390625, 2.103515625, 2.25927734375, 2.4150390625, 2.57080078125, 2.7265625, 2.88232421875, 3.0380859375, 3.19384765625, 3.349609375, 3.50537109375, 3.6611328125, 3.81689453125, 3.97265625, 4.12841796875, 4.2841796875, 4.43994140625, 4.595703125, 4.75146484375, 4.9072265625, 5.06298828125, 5.21875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 8.0, 6.0, 10.0, 13.0, 18.0, 39.0, 60.0, 67.0, 130.0, 211.0, 408.0, 708.0, 1521.0, 3383.0, 9765.0, 38504.0, 234240.0, 650586.0, 81878.0, 17206.0, 5446.0, 2162.0, 990.0, 457.0, 295.0, 184.0, 104.0, 64.0, 25.0, 22.0, 13.0, 11.0, 13.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.568359375, -1.5225372314453125, -1.476715087890625, -1.4308929443359375, -1.38507080078125, -1.3392486572265625, -1.293426513671875, -1.2476043701171875, -1.2017822265625, -1.1559600830078125, -1.110137939453125, -1.0643157958984375, -1.01849365234375, -0.9726715087890625, -0.926849365234375, -0.8810272216796875, -0.835205078125, -0.7893829345703125, -0.743560791015625, -0.6977386474609375, -0.65191650390625, -0.6060943603515625, -0.560272216796875, -0.5144500732421875, -0.4686279296875, -0.4228057861328125, -0.376983642578125, -0.3311614990234375, -0.28533935546875, -0.2395172119140625, -0.193695068359375, -0.1478729248046875, -0.10205078125, -0.0562286376953125, -0.010406494140625, 0.0354156494140625, 0.08123779296875, 0.1270599365234375, 0.172882080078125, 0.2187042236328125, 0.2645263671875, 0.3103485107421875, 0.356170654296875, 0.4019927978515625, 0.44781494140625, 0.4936370849609375, 0.539459228515625, 0.5852813720703125, 0.631103515625, 0.6769256591796875, 0.722747802734375, 0.7685699462890625, 0.81439208984375, 0.8602142333984375, 0.906036376953125, 0.9518585205078125, 0.9976806640625, 1.0435028076171875, 1.089324951171875, 1.1351470947265625, 1.18096923828125, 1.2267913818359375, 1.272613525390625, 1.3184356689453125, 1.3642578125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 8.0, 19.0, 30.0, 55.0, 64.0, 81.0, 127.0, 141.0, 127.0, 101.0, 74.0, 54.0, 26.0, 15.0, 27.0, 10.0, 5.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006537437438964844, -0.0006364211440086365, -0.0006190985441207886, -0.0006017759442329407, -0.0005844533443450928, -0.0005671307444572449, -0.000549808144569397, -0.0005324855446815491, -0.0005151629447937012, -0.0004978403449058533, -0.00048051774501800537, -0.00046319514513015747, -0.00044587254524230957, -0.00042854994535446167, -0.00041122734546661377, -0.00039390474557876587, -0.00037658214569091797, -0.00035925954580307007, -0.00034193694591522217, -0.00032461434602737427, -0.00030729174613952637, -0.00028996914625167847, -0.00027264654636383057, -0.00025532394647598267, -0.00023800134658813477, -0.00022067874670028687, -0.00020335614681243896, -0.00018603354692459106, -0.00016871094703674316, -0.00015138834714889526, -0.00013406574726104736, -0.00011674314737319946, -9.942054748535156e-05, -8.209794759750366e-05, -6.477534770965576e-05, -4.745274782180786e-05, -3.013014793395996e-05, -1.280754804611206e-05, 4.51505184173584e-06, 2.183765172958374e-05, 3.916025161743164e-05, 5.648285150527954e-05, 7.380545139312744e-05, 9.112805128097534e-05, 0.00010845065116882324, 0.00012577325105667114, 0.00014309585094451904, 0.00016041845083236694, 0.00017774105072021484, 0.00019506365060806274, 0.00021238625049591064, 0.00022970885038375854, 0.00024703145027160645, 0.00026435405015945435, 0.00028167665004730225, 0.00029899924993515015, 0.00031632184982299805, 0.00033364444971084595, 0.00035096704959869385, 0.00036828964948654175, 0.00038561224937438965, 0.00040293484926223755, 0.00042025744915008545, 0.00043758004903793335, 0.00045490264892578125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 5.0, 6.0, 14.0, 14.0, 30.0, 31.0, 66.0, 112.0, 158.0, 298.0, 595.0, 1275.0, 3269.0, 9693.0, 39545.0, 232161.0, 640944.0, 91980.0, 19020.0, 5508.0, 1997.0, 846.0, 415.0, 223.0, 131.0, 77.0, 51.0, 34.0, 23.0, 10.0, 9.0, 6.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6494140625, -1.606292724609375, -1.56317138671875, -1.520050048828125, -1.4769287109375, -1.433807373046875, -1.39068603515625, -1.347564697265625, -1.304443359375, -1.261322021484375, -1.21820068359375, -1.175079345703125, -1.1319580078125, -1.088836669921875, -1.04571533203125, -1.002593994140625, -0.95947265625, -0.916351318359375, -0.87322998046875, -0.830108642578125, -0.7869873046875, -0.743865966796875, -0.70074462890625, -0.657623291015625, -0.614501953125, -0.571380615234375, -0.52825927734375, -0.485137939453125, -0.4420166015625, -0.398895263671875, -0.35577392578125, -0.312652587890625, -0.26953125, -0.226409912109375, -0.18328857421875, -0.140167236328125, -0.0970458984375, -0.053924560546875, -0.01080322265625, 0.032318115234375, 0.075439453125, 0.118560791015625, 0.16168212890625, 0.204803466796875, 0.2479248046875, 0.291046142578125, 0.33416748046875, 0.377288818359375, 0.42041015625, 0.463531494140625, 0.50665283203125, 0.549774169921875, 0.5928955078125, 0.636016845703125, 0.67913818359375, 0.722259521484375, 0.765380859375, 0.808502197265625, 0.85162353515625, 0.894744873046875, 0.9378662109375, 0.980987548828125, 1.02410888671875, 1.067230224609375, 1.1103515625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 7.0, 3.0, 7.0, 5.0, 9.0, 4.0, 7.0, 13.0, 15.0, 12.0, 23.0, 18.0, 35.0, 39.0, 52.0, 57.0, 46.0, 73.0, 81.0, 68.0, 76.0, 63.0, 58.0, 52.0, 48.0, 24.0, 12.0, 15.0, 19.0, 17.0, 15.0, 10.0, 10.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.125, -1.0911407470703125, -1.057281494140625, -1.0234222412109375, -0.98956298828125, -0.9557037353515625, -0.921844482421875, -0.8879852294921875, -0.8541259765625, -0.8202667236328125, -0.786407470703125, -0.7525482177734375, -0.71868896484375, -0.6848297119140625, -0.650970458984375, -0.6171112060546875, -0.583251953125, -0.5493927001953125, -0.515533447265625, -0.4816741943359375, -0.44781494140625, -0.4139556884765625, -0.380096435546875, -0.3462371826171875, -0.3123779296875, -0.2785186767578125, -0.244659423828125, -0.2108001708984375, -0.17694091796875, -0.1430816650390625, -0.109222412109375, -0.0753631591796875, -0.04150390625, -0.0076446533203125, 0.026214599609375, 0.0600738525390625, 0.09393310546875, 0.1277923583984375, 0.161651611328125, 0.1955108642578125, 0.2293701171875, 0.2632293701171875, 0.297088623046875, 0.3309478759765625, 0.36480712890625, 0.3986663818359375, 0.432525634765625, 0.4663848876953125, 0.500244140625, 0.5341033935546875, 0.567962646484375, 0.6018218994140625, 0.63568115234375, 0.6695404052734375, 0.703399658203125, 0.7372589111328125, 0.7711181640625, 0.8049774169921875, 0.838836669921875, 0.8726959228515625, 0.90655517578125, 0.9404144287109375, 0.974273681640625, 1.0081329345703125, 1.0419921875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 15.0, 19.0, 49.0, 81.0, 141.0, 306.0, 190.0, 90.0, 46.0, 21.0, 21.0, 9.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.15484046936035, -19.0116024017334, -17.868366241455078, -16.725128173828125, -15.581890106201172, -14.438652038574219, -13.295414924621582, -12.152177810668945, -11.008939743041992, -9.865701675415039, -8.722464561462402, -7.579226970672607, -6.4359893798828125, -5.292751789093018, -4.149514198303223, -3.006277084350586, -1.8630390167236328, -0.7198014259338379, 0.42343616485595703, 1.566673755645752, 2.709911346435547, 3.853148937225342, 4.996386528015137, 6.139623641967773, 7.282861709594727, 8.42609977722168, 9.569336891174316, 10.712574005126953, 11.855812072753906, 12.99905014038086, 14.142287254333496, 15.285524368286133, 16.428760528564453, 17.571998596191406, 18.71523666381836, 19.85847282409668, 21.001710891723633, 22.144948959350586, 23.288185119628906, 24.43142318725586, 25.574661254882812, 26.717899322509766, 27.86113739013672, 29.00437355041504, 30.147611618041992, 31.290849685668945, 32.434085845947266, 33.57732391357422, 34.72056198120117, 35.863800048828125, 37.00703811645508, 38.15027618408203, 39.29351043701172, 40.43674850463867, 41.579986572265625, 42.72322463989258, 43.86646270751953, 45.009700775146484, 46.15293884277344, 47.29617691040039, 48.439414978027344, 49.58264923095703, 50.725887298583984, 51.86912536621094, 53.01236343383789]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 7.0, 5.0, 9.0, 24.0, 10.0, 11.0, 11.0, 20.0, 19.0, 30.0, 31.0, 23.0, 25.0, 34.0, 36.0, 47.0, 53.0, 87.0, 81.0, 55.0, 54.0, 40.0, 35.0, 28.0, 30.0, 21.0, 24.0, 20.0, 24.0, 20.0, 19.0, 10.0, 12.0, 10.0, 4.0, 6.0, 5.0, 7.0, 5.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.79754638671875, -21.118200302124023, -20.438852310180664, -19.759506225585938, -19.08016014099121, -18.400814056396484, -17.721466064453125, -17.0421199798584, -16.362773895263672, -15.683426856994629, -15.004080772399902, -14.32473373413086, -13.645387649536133, -12.96604061126709, -12.286693572998047, -11.60734748840332, -10.927999496459961, -10.248652458190918, -9.569306373596191, -8.889959335327148, -8.210613250732422, -7.531266212463379, -6.851919174194336, -6.172572612762451, -5.493226051330566, -4.813879489898682, -4.134532928466797, -3.455185890197754, -2.775839328765869, -2.0964927673339844, -1.4171457290649414, -0.7377991676330566, -0.05845069885253906, 0.6208959817886353, 1.3002426624298096, 1.9795894622802734, 2.658936023712158, 3.338282585144043, 4.017629623413086, 4.696976184844971, 5.3763227462768555, 6.05566930770874, 6.735015869140625, 7.414362907409668, 8.093709945678711, 8.773056030273438, 9.45240306854248, 10.131750106811523, 10.81109619140625, 11.490443229675293, 12.16978931427002, 12.849136352539062, 13.528482437133789, 14.207829475402832, 14.887176513671875, 15.566522598266602, 16.245868682861328, 16.925214767456055, 17.604562759399414, 18.28390884399414, 18.963254928588867, 19.642601013183594, 20.321949005126953, 21.00129508972168, 21.68064308166504]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 5.0, 11.0, 21.0, 33.0, 53.0, 70.0, 120.0, 198.0, 348.0, 731.0, 1587.0, 3925.0, 11863.0, 59274.0, 438781.0, 2204833.0, 1267269.0, 168274.0, 25372.0, 6727.0, 2478.0, 1087.0, 547.0, 270.0, 156.0, 99.0, 52.0, 38.0, 23.0, 18.0, 14.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.802734375, -1.7477264404296875, -1.692718505859375, -1.6377105712890625, -1.58270263671875, -1.5276947021484375, -1.472686767578125, -1.4176788330078125, -1.3626708984375, -1.3076629638671875, -1.252655029296875, -1.1976470947265625, -1.14263916015625, -1.0876312255859375, -1.032623291015625, -0.9776153564453125, -0.922607421875, -0.8675994873046875, -0.812591552734375, -0.7575836181640625, -0.70257568359375, -0.6475677490234375, -0.592559814453125, -0.5375518798828125, -0.4825439453125, -0.4275360107421875, -0.372528076171875, -0.3175201416015625, -0.26251220703125, -0.2075042724609375, -0.152496337890625, -0.0974884033203125, -0.04248046875, 0.0125274658203125, 0.067535400390625, 0.1225433349609375, 0.17755126953125, 0.2325592041015625, 0.287567138671875, 0.3425750732421875, 0.3975830078125, 0.4525909423828125, 0.507598876953125, 0.5626068115234375, 0.61761474609375, 0.6726226806640625, 0.727630615234375, 0.7826385498046875, 0.837646484375, 0.8926544189453125, 0.947662353515625, 1.0026702880859375, 1.05767822265625, 1.1126861572265625, 1.167694091796875, 1.2227020263671875, 1.2777099609375, 1.3327178955078125, 1.387725830078125, 1.4427337646484375, 1.49774169921875, 1.5527496337890625, 1.607757568359375, 1.6627655029296875, 1.7177734375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 3.0, 7.0, 2.0, 9.0, 7.0, 6.0, 14.0, 13.0, 18.0, 17.0, 30.0, 23.0, 35.0, 33.0, 27.0, 32.0, 24.0, 28.0, 40.0, 34.0, 50.0, 43.0, 52.0, 42.0, 44.0, 34.0, 49.0, 32.0, 28.0, 27.0, 32.0, 17.0, 14.0, 22.0, 17.0, 17.0, 14.0, 15.0, 10.0, 8.0, 7.0, 5.0, 4.0, 0.0, 4.0, 3.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1171875, -1.079681396484375, -1.04217529296875, -1.004669189453125, -0.9671630859375, -0.929656982421875, -0.89215087890625, -0.854644775390625, -0.817138671875, -0.779632568359375, -0.74212646484375, -0.704620361328125, -0.6671142578125, -0.629608154296875, -0.59210205078125, -0.554595947265625, -0.51708984375, -0.479583740234375, -0.44207763671875, -0.404571533203125, -0.3670654296875, -0.329559326171875, -0.29205322265625, -0.254547119140625, -0.217041015625, -0.179534912109375, -0.14202880859375, -0.104522705078125, -0.0670166015625, -0.029510498046875, 0.00799560546875, 0.045501708984375, 0.0830078125, 0.120513916015625, 0.15802001953125, 0.195526123046875, 0.2330322265625, 0.270538330078125, 0.30804443359375, 0.345550537109375, 0.383056640625, 0.420562744140625, 0.45806884765625, 0.495574951171875, 0.5330810546875, 0.570587158203125, 0.60809326171875, 0.645599365234375, 0.68310546875, 0.720611572265625, 0.75811767578125, 0.795623779296875, 0.8331298828125, 0.870635986328125, 0.90814208984375, 0.945648193359375, 0.983154296875, 1.020660400390625, 1.05816650390625, 1.095672607421875, 1.1331787109375, 1.170684814453125, 1.20819091796875, 1.245697021484375, 1.283203125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 1.0, 6.0, 7.0, 7.0, 15.0, 9.0, 15.0, 26.0, 39.0, 108.0, 229.0, 666.0, 2221.0, 11322.0, 260983.0, 3843894.0, 66548.0, 6068.0, 1296.0, 440.0, 153.0, 79.0, 45.0, 24.0, 14.0, 12.0, 8.0, 11.0, 8.0, 4.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.92578125, -5.7626953125, -5.599609375, -5.4365234375, -5.2734375, -5.1103515625, -4.947265625, -4.7841796875, -4.62109375, -4.4580078125, -4.294921875, -4.1318359375, -3.96875, -3.8056640625, -3.642578125, -3.4794921875, -3.31640625, -3.1533203125, -2.990234375, -2.8271484375, -2.6640625, -2.5009765625, -2.337890625, -2.1748046875, -2.01171875, -1.8486328125, -1.685546875, -1.5224609375, -1.359375, -1.1962890625, -1.033203125, -0.8701171875, -0.70703125, -0.5439453125, -0.380859375, -0.2177734375, -0.0546875, 0.1083984375, 0.271484375, 0.4345703125, 0.59765625, 0.7607421875, 0.923828125, 1.0869140625, 1.25, 1.4130859375, 1.576171875, 1.7392578125, 1.90234375, 2.0654296875, 2.228515625, 2.3916015625, 2.5546875, 2.7177734375, 2.880859375, 3.0439453125, 3.20703125, 3.3701171875, 3.533203125, 3.6962890625, 3.859375, 4.0224609375, 4.185546875, 4.3486328125, 4.51171875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 8.0, 7.0, 16.0, 13.0, 20.0, 30.0, 60.0, 107.0, 213.0, 370.0, 655.0, 900.0, 734.0, 411.0, 217.0, 111.0, 72.0, 49.0, 23.0, 19.0, 10.0, 9.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.892578125, -3.773284912109375, -3.65399169921875, -3.534698486328125, -3.4154052734375, -3.296112060546875, -3.17681884765625, -3.057525634765625, -2.938232421875, -2.818939208984375, -2.69964599609375, -2.580352783203125, -2.4610595703125, -2.341766357421875, -2.22247314453125, -2.103179931640625, -1.98388671875, -1.864593505859375, -1.74530029296875, -1.626007080078125, -1.5067138671875, -1.387420654296875, -1.26812744140625, -1.148834228515625, -1.029541015625, -0.910247802734375, -0.79095458984375, -0.671661376953125, -0.5523681640625, -0.433074951171875, -0.31378173828125, -0.194488525390625, -0.0751953125, 0.044097900390625, 0.16339111328125, 0.282684326171875, 0.4019775390625, 0.521270751953125, 0.64056396484375, 0.759857177734375, 0.879150390625, 0.998443603515625, 1.11773681640625, 1.237030029296875, 1.3563232421875, 1.475616455078125, 1.59490966796875, 1.714202880859375, 1.83349609375, 1.952789306640625, 2.07208251953125, 2.191375732421875, 2.3106689453125, 2.429962158203125, 2.54925537109375, 2.668548583984375, 2.787841796875, 2.907135009765625, 3.02642822265625, 3.145721435546875, 3.2650146484375, 3.384307861328125, 3.50360107421875, 3.622894287109375, 3.7421875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 4.0, 12.0, 16.0, 49.0, 93.0, 168.0, 211.0, 217.0, 136.0, 53.0, 24.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.830060958862305, -20.823678970336914, -19.81729507446289, -18.8109130859375, -17.80453109741211, -16.798147201538086, -15.791765213012695, -14.785382270812988, -13.778999328613281, -12.772616386413574, -11.766233444213867, -10.759851455688477, -9.75346851348877, -8.747085571289062, -7.740703105926514, -6.734320640563965, -5.727937698364258, -4.721554756164551, -3.715172290802002, -2.708789587020874, -1.702406883239746, -0.6960239410400391, 0.31035852432250977, 1.3167409896850586, 2.3231239318847656, 3.3295066356658936, 4.3358893394470215, 5.34227180480957, 6.348654747009277, 7.355037689208984, 8.361419677734375, 9.367802619934082, 10.374187469482422, 11.380570411682129, 12.386953353881836, 13.393335342407227, 14.399718284606934, 15.40610122680664, 16.41248321533203, 17.418865203857422, 18.425249099731445, 19.431631088256836, 20.43801498413086, 21.44439697265625, 22.45077896118164, 23.457162857055664, 24.463544845581055, 25.469928741455078, 26.47631072998047, 27.48269271850586, 28.489076614379883, 29.495458602905273, 30.501842498779297, 31.508224487304688, 32.51460647583008, 33.52098846435547, 34.527374267578125, 35.533756256103516, 36.540138244628906, 37.54652404785156, 38.55290603637695, 39.559288024902344, 40.565670013427734, 41.572052001953125, 42.578433990478516]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 7.0, 4.0, 12.0, 8.0, 12.0, 28.0, 35.0, 48.0, 50.0, 65.0, 80.0, 68.0, 70.0, 68.0, 67.0, 85.0, 63.0, 60.0, 32.0, 32.0, 31.0, 24.0, 20.0, 13.0, 11.0, 5.0, 4.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.095389366149902, -13.460210800170898, -12.825032234191895, -12.18985366821289, -11.55467414855957, -10.919495582580566, -10.284317016601562, -9.649137496948242, -9.013959884643555, -8.37878131866455, -7.743602275848389, -7.108423709869385, -6.473244667053223, -5.838066101074219, -5.202887535095215, -4.567708492279053, -3.9325294494628906, -3.2973506450653076, -2.6621718406677246, -2.0269932746887207, -1.3918144702911377, -0.7566356658935547, -0.12145709991455078, 0.5137219429016113, 1.1489005088806152, 1.7840793132781982, 2.4192581176757812, 3.054436683654785, 3.689615488052368, 4.324794292449951, 4.959972858428955, 5.595151901245117, 6.230329513549805, 6.865508079528809, 7.500687122344971, 8.135866165161133, 8.771044731140137, 9.40622329711914, 10.041401863098145, 10.676580429077148, 11.311759948730469, 11.946938514709473, 12.582117080688477, 13.217296600341797, 13.8524751663208, 14.487653732299805, 15.122832298278809, 15.758010864257812, 16.3931884765625, 17.02836799621582, 17.663545608520508, 18.298725128173828, 18.933902740478516, 19.569082260131836, 20.204261779785156, 20.839439392089844, 21.474618911743164, 22.109798431396484, 22.744976043701172, 23.380155563354492, 24.01533317565918, 24.6505126953125, 25.285690307617188, 25.920869827270508, 26.556049346923828]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 9.0, 14.0, 3.0, 8.0, 17.0, 21.0, 28.0, 49.0, 77.0, 121.0, 183.0, 352.0, 551.0, 1012.0, 1957.0, 3411.0, 6575.0, 12662.0, 24492.0, 47830.0, 92899.0, 173058.0, 248663.0, 200564.0, 113051.0, 58182.0, 30055.0, 15265.0, 8016.0, 4215.0, 2255.0, 1230.0, 739.0, 390.0, 219.0, 126.0, 96.0, 52.0, 38.0, 33.0, 14.0, 13.0, 6.0, 3.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2255859375, -1.1812591552734375, -1.136932373046875, -1.0926055908203125, -1.04827880859375, -1.0039520263671875, -0.959625244140625, -0.9152984619140625, -0.8709716796875, -0.8266448974609375, -0.782318115234375, -0.7379913330078125, -0.69366455078125, -0.6493377685546875, -0.605010986328125, -0.5606842041015625, -0.516357421875, -0.4720306396484375, -0.427703857421875, -0.3833770751953125, -0.33905029296875, -0.2947235107421875, -0.250396728515625, -0.2060699462890625, -0.1617431640625, -0.1174163818359375, -0.073089599609375, -0.0287628173828125, 0.01556396484375, 0.0598907470703125, 0.104217529296875, 0.1485443115234375, 0.19287109375, 0.2371978759765625, 0.281524658203125, 0.3258514404296875, 0.37017822265625, 0.4145050048828125, 0.458831787109375, 0.5031585693359375, 0.5474853515625, 0.5918121337890625, 0.636138916015625, 0.6804656982421875, 0.72479248046875, 0.7691192626953125, 0.813446044921875, 0.8577728271484375, 0.902099609375, 0.9464263916015625, 0.990753173828125, 1.0350799560546875, 1.07940673828125, 1.1237335205078125, 1.168060302734375, 1.2123870849609375, 1.2567138671875, 1.3010406494140625, 1.345367431640625, 1.3896942138671875, 1.43402099609375, 1.4783477783203125, 1.522674560546875, 1.5670013427734375, 1.611328125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 3.0, 4.0, 6.0, 13.0, 9.0, 15.0, 23.0, 19.0, 22.0, 34.0, 31.0, 35.0, 32.0, 34.0, 27.0, 41.0, 37.0, 45.0, 45.0, 43.0, 48.0, 47.0, 53.0, 35.0, 35.0, 29.0, 24.0, 32.0, 27.0, 20.0, 25.0, 20.0, 18.0, 9.0, 12.0, 11.0, 4.0, 9.0, 4.0, 8.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.171875, -1.1307220458984375, -1.089569091796875, -1.0484161376953125, -1.00726318359375, -0.9661102294921875, -0.924957275390625, -0.8838043212890625, -0.8426513671875, -0.8014984130859375, -0.760345458984375, -0.7191925048828125, -0.67803955078125, -0.6368865966796875, -0.595733642578125, -0.5545806884765625, -0.513427734375, -0.4722747802734375, -0.431121826171875, -0.3899688720703125, -0.34881591796875, -0.3076629638671875, -0.266510009765625, -0.2253570556640625, -0.1842041015625, -0.1430511474609375, -0.101898193359375, -0.0607452392578125, -0.01959228515625, 0.0215606689453125, 0.062713623046875, 0.1038665771484375, 0.14501953125, 0.1861724853515625, 0.227325439453125, 0.2684783935546875, 0.30963134765625, 0.3507843017578125, 0.391937255859375, 0.4330902099609375, 0.4742431640625, 0.5153961181640625, 0.556549072265625, 0.5977020263671875, 0.63885498046875, 0.6800079345703125, 0.721160888671875, 0.7623138427734375, 0.803466796875, 0.8446197509765625, 0.885772705078125, 0.9269256591796875, 0.96807861328125, 1.0092315673828125, 1.050384521484375, 1.0915374755859375, 1.1326904296875, 1.1738433837890625, 1.214996337890625, 1.2561492919921875, 1.29730224609375, 1.3384552001953125, 1.379608154296875, 1.4207611083984375, 1.4619140625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 3.0, 5.0, 8.0, 10.0, 13.0, 20.0, 25.0, 35.0, 41.0, 78.0, 121.0, 138.0, 243.0, 396.0, 650.0, 1342.0, 3727.0, 17972.0, 141581.0, 747368.0, 113296.0, 15135.0, 3377.0, 1212.0, 610.0, 379.0, 243.0, 180.0, 111.0, 72.0, 51.0, 34.0, 30.0, 24.0, 7.0, 10.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.15234375, -5.0147705078125, -4.877197265625, -4.7396240234375, -4.60205078125, -4.4644775390625, -4.326904296875, -4.1893310546875, -4.0517578125, -3.9141845703125, -3.776611328125, -3.6390380859375, -3.50146484375, -3.3638916015625, -3.226318359375, -3.0887451171875, -2.951171875, -2.8135986328125, -2.676025390625, -2.5384521484375, -2.40087890625, -2.2633056640625, -2.125732421875, -1.9881591796875, -1.8505859375, -1.7130126953125, -1.575439453125, -1.4378662109375, -1.30029296875, -1.1627197265625, -1.025146484375, -0.8875732421875, -0.75, -0.6124267578125, -0.474853515625, -0.3372802734375, -0.19970703125, -0.0621337890625, 0.075439453125, 0.2130126953125, 0.3505859375, 0.4881591796875, 0.625732421875, 0.7633056640625, 0.90087890625, 1.0384521484375, 1.176025390625, 1.3135986328125, 1.451171875, 1.5887451171875, 1.726318359375, 1.8638916015625, 2.00146484375, 2.1390380859375, 2.276611328125, 2.4141845703125, 2.5517578125, 2.6893310546875, 2.826904296875, 2.9644775390625, 3.10205078125, 3.2396240234375, 3.377197265625, 3.5147705078125, 3.65234375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 11.0, 14.0, 16.0, 21.0, 21.0, 35.0, 34.0, 39.0, 48.0, 60.0, 66.0, 59.0, 68.0, 78.0, 64.0, 59.0, 42.0, 47.0, 37.0, 33.0, 30.0, 24.0, 21.0, 19.0, 10.0, 11.0, 4.0, 8.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.1328125, -6.92205810546875, -6.7113037109375, -6.50054931640625, -6.289794921875, -6.07904052734375, -5.8682861328125, -5.65753173828125, -5.44677734375, -5.23602294921875, -5.0252685546875, -4.81451416015625, -4.603759765625, -4.39300537109375, -4.1822509765625, -3.97149658203125, -3.7607421875, -3.54998779296875, -3.3392333984375, -3.12847900390625, -2.917724609375, -2.70697021484375, -2.4962158203125, -2.28546142578125, -2.07470703125, -1.86395263671875, -1.6531982421875, -1.44244384765625, -1.231689453125, -1.02093505859375, -0.8101806640625, -0.59942626953125, -0.388671875, -0.17791748046875, 0.0328369140625, 0.24359130859375, 0.454345703125, 0.66510009765625, 0.8758544921875, 1.08660888671875, 1.29736328125, 1.50811767578125, 1.7188720703125, 1.92962646484375, 2.140380859375, 2.35113525390625, 2.5618896484375, 2.77264404296875, 2.9833984375, 3.19415283203125, 3.4049072265625, 3.61566162109375, 3.826416015625, 4.03717041015625, 4.2479248046875, 4.45867919921875, 4.66943359375, 4.88018798828125, 5.0909423828125, 5.30169677734375, 5.512451171875, 5.72320556640625, 5.9339599609375, 6.14471435546875, 6.35546875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 7.0, 10.0, 7.0, 18.0, 15.0, 21.0, 31.0, 60.0, 76.0, 113.0, 180.0, 341.0, 606.0, 1124.0, 2449.0, 5798.0, 16334.0, 56330.0, 243994.0, 593961.0, 88731.0, 24102.0, 7938.0, 3175.0, 1391.0, 746.0, 362.0, 219.0, 106.0, 80.0, 61.0, 45.0, 36.0, 22.0, 12.0, 10.0, 15.0, 5.0, 3.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.90185546875, -0.8698348999023438, -0.8378143310546875, -0.8057937622070312, -0.773773193359375, -0.7417526245117188, -0.7097320556640625, -0.6777114868164062, -0.64569091796875, -0.6136703491210938, -0.5816497802734375, -0.5496292114257812, -0.517608642578125, -0.48558807373046875, -0.4535675048828125, -0.42154693603515625, -0.3895263671875, -0.35750579833984375, -0.3254852294921875, -0.29346466064453125, -0.261444091796875, -0.22942352294921875, -0.1974029541015625, -0.16538238525390625, -0.13336181640625, -0.10134124755859375, -0.0693206787109375, -0.03730010986328125, -0.005279541015625, 0.02674102783203125, 0.0587615966796875, 0.09078216552734375, 0.122802734375, 0.15482330322265625, 0.1868438720703125, 0.21886444091796875, 0.250885009765625, 0.28290557861328125, 0.3149261474609375, 0.34694671630859375, 0.37896728515625, 0.41098785400390625, 0.4430084228515625, 0.47502899169921875, 0.507049560546875, 0.5390701293945312, 0.5710906982421875, 0.6031112670898438, 0.6351318359375, 0.6671524047851562, 0.6991729736328125, 0.7311935424804688, 0.763214111328125, 0.7952346801757812, 0.8272552490234375, 0.8592758178710938, 0.89129638671875, 0.9233169555664062, 0.9553375244140625, 0.9873580932617188, 1.019378662109375, 1.0513992309570312, 1.0834197998046875, 1.1154403686523438, 1.1474609375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 10.0, 12.0, 8.0, 15.0, 32.0, 24.0, 31.0, 52.0, 55.0, 66.0, 102.0, 112.0, 126.0, 93.0, 63.0, 43.0, 36.0, 21.0, 21.0, 11.0, 21.0, 5.0, 8.0, 6.0, 3.0, 5.0, 3.0, 6.0, 2.0, 2.0, 1.0], "bins": [-0.0005640983581542969, -0.0005515515804290771, -0.0005390048027038574, -0.0005264580249786377, -0.000513911247253418, -0.0005013644695281982, -0.0004888176918029785, -0.0004762709140777588, -0.00046372413635253906, -0.00045117735862731934, -0.0004386305809020996, -0.0004260838031768799, -0.00041353702545166016, -0.00040099024772644043, -0.0003884434700012207, -0.000375896692276001, -0.00036334991455078125, -0.0003508031368255615, -0.0003382563591003418, -0.00032570958137512207, -0.00031316280364990234, -0.0003006160259246826, -0.0002880692481994629, -0.00027552247047424316, -0.00026297569274902344, -0.0002504289150238037, -0.00023788213729858398, -0.00022533535957336426, -0.00021278858184814453, -0.0002002418041229248, -0.00018769502639770508, -0.00017514824867248535, -0.00016260147094726562, -0.0001500546932220459, -0.00013750791549682617, -0.00012496113777160645, -0.00011241436004638672, -9.986758232116699e-05, -8.732080459594727e-05, -7.477402687072754e-05, -6.222724914550781e-05, -4.9680471420288086e-05, -3.713369369506836e-05, -2.4586915969848633e-05, -1.2040138244628906e-05, 5.066394805908203e-07, 1.3053417205810547e-05, 2.5600194931030273e-05, 3.814697265625e-05, 5.0693750381469727e-05, 6.324052810668945e-05, 7.578730583190918e-05, 8.83340835571289e-05, 0.00010088086128234863, 0.00011342763900756836, 0.00012597441673278809, 0.0001385211944580078, 0.00015106797218322754, 0.00016361474990844727, 0.000176161527633667, 0.00018870830535888672, 0.00020125508308410645, 0.00021380186080932617, 0.0002263486385345459, 0.00023889541625976562]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 8.0, 3.0, 4.0, 9.0, 13.0, 22.0, 41.0, 45.0, 80.0, 149.0, 264.0, 504.0, 1323.0, 3727.0, 14387.0, 82583.0, 716334.0, 191175.0, 28165.0, 6233.0, 1943.0, 732.0, 353.0, 172.0, 110.0, 54.0, 35.0, 28.0, 21.0, 13.0, 3.0, 6.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1748046875, -1.1308135986328125, -1.086822509765625, -1.0428314208984375, -0.99884033203125, -0.9548492431640625, -0.910858154296875, -0.8668670654296875, -0.8228759765625, -0.7788848876953125, -0.734893798828125, -0.6909027099609375, -0.64691162109375, -0.6029205322265625, -0.558929443359375, -0.5149383544921875, -0.470947265625, -0.4269561767578125, -0.382965087890625, -0.3389739990234375, -0.29498291015625, -0.2509918212890625, -0.207000732421875, -0.1630096435546875, -0.1190185546875, -0.0750274658203125, -0.031036376953125, 0.0129547119140625, 0.05694580078125, 0.1009368896484375, 0.144927978515625, 0.1889190673828125, 0.23291015625, 0.2769012451171875, 0.320892333984375, 0.3648834228515625, 0.40887451171875, 0.4528656005859375, 0.496856689453125, 0.5408477783203125, 0.5848388671875, 0.6288299560546875, 0.672821044921875, 0.7168121337890625, 0.76080322265625, 0.8047943115234375, 0.848785400390625, 0.8927764892578125, 0.936767578125, 0.9807586669921875, 1.024749755859375, 1.0687408447265625, 1.11273193359375, 1.1567230224609375, 1.200714111328125, 1.2447052001953125, 1.2886962890625, 1.3326873779296875, 1.376678466796875, 1.4206695556640625, 1.46466064453125, 1.5086517333984375, 1.552642822265625, 1.5966339111328125, 1.640625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 14.0, 7.0, 13.0, 14.0, 21.0, 34.0, 45.0, 46.0, 54.0, 76.0, 84.0, 97.0, 108.0, 90.0, 74.0, 50.0, 44.0, 37.0, 28.0, 13.0, 12.0, 10.0, 10.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3203125, -1.27972412109375, -1.2391357421875, -1.19854736328125, -1.157958984375, -1.11737060546875, -1.0767822265625, -1.03619384765625, -0.99560546875, -0.95501708984375, -0.9144287109375, -0.87384033203125, -0.833251953125, -0.79266357421875, -0.7520751953125, -0.71148681640625, -0.6708984375, -0.63031005859375, -0.5897216796875, -0.54913330078125, -0.508544921875, -0.46795654296875, -0.4273681640625, -0.38677978515625, -0.34619140625, -0.30560302734375, -0.2650146484375, -0.22442626953125, -0.183837890625, -0.14324951171875, -0.1026611328125, -0.06207275390625, -0.021484375, 0.01910400390625, 0.0596923828125, 0.10028076171875, 0.140869140625, 0.18145751953125, 0.2220458984375, 0.26263427734375, 0.30322265625, 0.34381103515625, 0.3843994140625, 0.42498779296875, 0.465576171875, 0.50616455078125, 0.5467529296875, 0.58734130859375, 0.6279296875, 0.66851806640625, 0.7091064453125, 0.74969482421875, 0.790283203125, 0.83087158203125, 0.8714599609375, 0.91204833984375, 0.95263671875, 0.99322509765625, 1.0338134765625, 1.07440185546875, 1.114990234375, 1.15557861328125, 1.1961669921875, 1.23675537109375, 1.27734375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 5.0, 18.0, 43.0, 104.0, 220.0, 313.0, 155.0, 73.0, 38.0, 11.0, 11.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.646297454833984, -41.35685729980469, -40.067413330078125, -38.77796936035156, -37.488529205322266, -36.19908905029297, -34.909645080566406, -33.620201110839844, -32.33076095581055, -31.041318893432617, -29.751876831054688, -28.462434768676758, -27.172992706298828, -25.8835506439209, -24.59410858154297, -23.30466651916504, -22.01522445678711, -20.72578239440918, -19.43634033203125, -18.14689826965332, -16.85745620727539, -15.568014144897461, -14.278572082519531, -12.989130020141602, -11.699687957763672, -10.410245895385742, -9.120803833007812, -7.831361770629883, -6.541919708251953, -5.252477645874023, -3.9630355834960938, -2.673593521118164, -1.3841476440429688, -0.09470558166503906, 1.1947364807128906, 2.4841785430908203, 3.77362060546875, 5.06306266784668, 6.352504730224609, 7.641946792602539, 8.931388854980469, 10.220830917358398, 11.510272979736328, 12.799715042114258, 14.089157104492188, 15.378599166870117, 16.668041229248047, 17.957483291625977, 19.246925354003906, 20.536367416381836, 21.825809478759766, 23.115251541137695, 24.404693603515625, 25.694135665893555, 26.983577728271484, 28.273019790649414, 29.562461853027344, 30.851903915405273, 32.1413459777832, 33.4307861328125, 34.72023010253906, 36.009674072265625, 37.29911422729492, 38.58855438232422, 39.87799835205078]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 5.0, 4.0, 2.0, 9.0, 2.0, 6.0, 4.0, 10.0, 6.0, 11.0, 9.0, 13.0, 10.0, 19.0, 18.0, 23.0, 18.0, 26.0, 32.0, 31.0, 45.0, 55.0, 78.0, 105.0, 104.0, 50.0, 36.0, 27.0, 34.0, 25.0, 33.0, 20.0, 18.0, 18.0, 10.0, 20.0, 18.0, 13.0, 14.0, 4.0, 8.0, 3.0, 5.0, 2.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.231552124023438, -20.5985107421875, -19.965469360351562, -19.332427978515625, -18.699386596679688, -18.06634521484375, -17.433303833007812, -16.800262451171875, -16.167221069335938, -15.5341796875, -14.901138305664062, -14.268096923828125, -13.635055541992188, -13.00201416015625, -12.368972778320312, -11.735931396484375, -11.102890014648438, -10.4698486328125, -9.836807250976562, -9.203765869140625, -8.570724487304688, -7.93768310546875, -7.3046417236328125, -6.671600341796875, -6.0385589599609375, -5.405517578125, -4.7724761962890625, -4.139434814453125, -3.5063934326171875, -2.87335205078125, -2.2403106689453125, -1.607269287109375, -0.9742279052734375, -0.3411865234375, 0.2918548583984375, 0.924896240234375, 1.5579376220703125, 2.19097900390625, 2.8240203857421875, 3.457061767578125, 4.0901031494140625, 4.72314453125, 5.3561859130859375, 5.989227294921875, 6.6222686767578125, 7.25531005859375, 7.8883514404296875, 8.521392822265625, 9.154434204101562, 9.7874755859375, 10.420516967773438, 11.053558349609375, 11.686599731445312, 12.31964111328125, 12.952682495117188, 13.585723876953125, 14.218765258789062, 14.851806640625, 15.484848022460938, 16.117889404296875, 16.750930786132812, 17.38397216796875, 18.017013549804688, 18.650054931640625, 19.283096313476562]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 6.0, 6.0, 5.0, 13.0, 16.0, 5.0, 14.0, 29.0, 47.0, 44.0, 69.0, 98.0, 165.0, 221.0, 426.0, 816.0, 1606.0, 3462.0, 9385.0, 37557.0, 270114.0, 1809496.0, 1744136.0, 262132.0, 37663.0, 9685.0, 3604.0, 1562.0, 800.0, 408.0, 237.0, 131.0, 85.0, 61.0, 53.0, 27.0, 20.0, 13.0, 17.0, 17.0, 15.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0, -1.9393768310546875, -1.878753662109375, -1.8181304931640625, -1.75750732421875, -1.6968841552734375, -1.636260986328125, -1.5756378173828125, -1.5150146484375, -1.4543914794921875, -1.393768310546875, -1.3331451416015625, -1.27252197265625, -1.2118988037109375, -1.151275634765625, -1.0906524658203125, -1.030029296875, -0.9694061279296875, -0.908782958984375, -0.8481597900390625, -0.78753662109375, -0.7269134521484375, -0.666290283203125, -0.6056671142578125, -0.5450439453125, -0.4844207763671875, -0.423797607421875, -0.3631744384765625, -0.30255126953125, -0.2419281005859375, -0.181304931640625, -0.1206817626953125, -0.06005859375, 0.0005645751953125, 0.061187744140625, 0.1218109130859375, 0.18243408203125, 0.2430572509765625, 0.303680419921875, 0.3643035888671875, 0.4249267578125, 0.4855499267578125, 0.546173095703125, 0.6067962646484375, 0.66741943359375, 0.7280426025390625, 0.788665771484375, 0.8492889404296875, 0.909912109375, 0.9705352783203125, 1.031158447265625, 1.0917816162109375, 1.15240478515625, 1.2130279541015625, 1.273651123046875, 1.3342742919921875, 1.3948974609375, 1.4555206298828125, 1.516143798828125, 1.5767669677734375, 1.63739013671875, 1.6980133056640625, 1.758636474609375, 1.8192596435546875, 1.8798828125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 8.0, 9.0, 14.0, 14.0, 30.0, 26.0, 22.0, 25.0, 32.0, 30.0, 46.0, 47.0, 50.0, 45.0, 61.0, 58.0, 60.0, 61.0, 41.0, 46.0, 45.0, 48.0, 36.0, 24.0, 26.0, 24.0, 18.0, 11.0, 11.0, 11.0, 11.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8720703125, -1.8221588134765625, -1.772247314453125, -1.7223358154296875, -1.67242431640625, -1.6225128173828125, -1.572601318359375, -1.5226898193359375, -1.4727783203125, -1.4228668212890625, -1.372955322265625, -1.3230438232421875, -1.27313232421875, -1.2232208251953125, -1.173309326171875, -1.1233978271484375, -1.073486328125, -1.0235748291015625, -0.973663330078125, -0.9237518310546875, -0.87384033203125, -0.8239288330078125, -0.774017333984375, -0.7241058349609375, -0.6741943359375, -0.6242828369140625, -0.574371337890625, -0.5244598388671875, -0.47454833984375, -0.4246368408203125, -0.374725341796875, -0.3248138427734375, -0.27490234375, -0.2249908447265625, -0.175079345703125, -0.1251678466796875, -0.07525634765625, -0.0253448486328125, 0.024566650390625, 0.0744781494140625, 0.1243896484375, 0.1743011474609375, 0.224212646484375, 0.2741241455078125, 0.32403564453125, 0.3739471435546875, 0.423858642578125, 0.4737701416015625, 0.523681640625, 0.5735931396484375, 0.623504638671875, 0.6734161376953125, 0.72332763671875, 0.7732391357421875, 0.823150634765625, 0.8730621337890625, 0.9229736328125, 0.9728851318359375, 1.022796630859375, 1.0727081298828125, 1.12261962890625, 1.1725311279296875, 1.222442626953125, 1.2723541259765625, 1.322265625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 7.0, 14.0, 25.0, 32.0, 75.0, 136.0, 328.0, 903.0, 6376.0, 937968.0, 3236815.0, 10003.0, 1038.0, 271.0, 141.0, 70.0, 31.0, 23.0, 7.0, 7.0, 5.0, 5.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.2734375, -9.0013427734375, -8.729248046875, -8.4571533203125, -8.18505859375, -7.9129638671875, -7.640869140625, -7.3687744140625, -7.0966796875, -6.8245849609375, -6.552490234375, -6.2803955078125, -6.00830078125, -5.7362060546875, -5.464111328125, -5.1920166015625, -4.919921875, -4.6478271484375, -4.375732421875, -4.1036376953125, -3.83154296875, -3.5594482421875, -3.287353515625, -3.0152587890625, -2.7431640625, -2.4710693359375, -2.198974609375, -1.9268798828125, -1.65478515625, -1.3826904296875, -1.110595703125, -0.8385009765625, -0.56640625, -0.2943115234375, -0.022216796875, 0.2498779296875, 0.52197265625, 0.7940673828125, 1.066162109375, 1.3382568359375, 1.6103515625, 1.8824462890625, 2.154541015625, 2.4266357421875, 2.69873046875, 2.9708251953125, 3.242919921875, 3.5150146484375, 3.787109375, 4.0592041015625, 4.331298828125, 4.6033935546875, 4.87548828125, 5.1475830078125, 5.419677734375, 5.6917724609375, 5.9638671875, 6.2359619140625, 6.508056640625, 6.7801513671875, 7.05224609375, 7.3243408203125, 7.596435546875, 7.8685302734375, 8.140625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 4.0, 3.0, 6.0, 3.0, 8.0, 7.0, 15.0, 19.0, 29.0, 43.0, 66.0, 80.0, 138.0, 265.0, 391.0, 642.0, 743.0, 597.0, 402.0, 249.0, 139.0, 82.0, 51.0, 27.0, 19.0, 12.0, 13.0, 5.0, 7.0, 3.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-5.04296875, -4.92694091796875, -4.8109130859375, -4.69488525390625, -4.578857421875, -4.46282958984375, -4.3468017578125, -4.23077392578125, -4.11474609375, -3.99871826171875, -3.8826904296875, -3.76666259765625, -3.650634765625, -3.53460693359375, -3.4185791015625, -3.30255126953125, -3.1865234375, -3.07049560546875, -2.9544677734375, -2.83843994140625, -2.722412109375, -2.60638427734375, -2.4903564453125, -2.37432861328125, -2.25830078125, -2.14227294921875, -2.0262451171875, -1.91021728515625, -1.794189453125, -1.67816162109375, -1.5621337890625, -1.44610595703125, -1.330078125, -1.21405029296875, -1.0980224609375, -0.98199462890625, -0.865966796875, -0.74993896484375, -0.6339111328125, -0.51788330078125, -0.40185546875, -0.28582763671875, -0.1697998046875, -0.05377197265625, 0.062255859375, 0.17828369140625, 0.2943115234375, 0.41033935546875, 0.5263671875, 0.64239501953125, 0.7584228515625, 0.87445068359375, 0.990478515625, 1.10650634765625, 1.2225341796875, 1.33856201171875, 1.45458984375, 1.57061767578125, 1.6866455078125, 1.80267333984375, 1.918701171875, 2.03472900390625, 2.1507568359375, 2.26678466796875, 2.3828125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 3.0, 2.0, 2.0, 6.0, 9.0, 13.0, 13.0, 26.0, 47.0, 78.0, 137.0, 174.0, 193.0, 138.0, 74.0, 41.0, 28.0, 10.0, 7.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-48.44757843017578, -47.46179962158203, -46.47602081298828, -45.49024200439453, -44.50446319580078, -43.51868438720703, -42.53290557861328, -41.547122955322266, -40.561344146728516, -39.575565338134766, -38.589786529541016, -37.604007720947266, -36.618228912353516, -35.6324462890625, -34.64666748046875, -33.660888671875, -32.67510986328125, -31.6893310546875, -30.70355224609375, -29.7177734375, -28.731992721557617, -27.746213912963867, -26.760435104370117, -25.774656295776367, -24.78887939453125, -23.8031005859375, -22.81732177734375, -21.83154296875, -20.845762252807617, -19.859983444213867, -18.874204635620117, -17.888425827026367, -16.902647018432617, -15.916868209838867, -14.9310884475708, -13.94530963897705, -12.959529876708984, -11.973751068115234, -10.987972259521484, -10.002193450927734, -9.016413688659668, -8.030634880065918, -7.044855117797852, -6.059076309204102, -5.073297023773193, -4.087517738342285, -3.101738929748535, -2.115959644317627, -1.1301803588867188, -0.1444011926651001, 0.8413779735565186, 1.8271570205688477, 2.812936305999756, 3.798715591430664, 4.784494400024414, 5.770273685455322, 6.7560529708862305, 7.741832256317139, 8.727611541748047, 9.713390350341797, 10.699169158935547, 11.684948921203613, 12.670727729797363, 13.65650749206543, 14.64228630065918]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 7.0, 5.0, 5.0, 7.0, 10.0, 11.0, 12.0, 21.0, 23.0, 26.0, 32.0, 24.0, 50.0, 29.0, 45.0, 53.0, 46.0, 56.0, 41.0, 40.0, 61.0, 39.0, 46.0, 44.0, 32.0, 40.0, 33.0, 26.0, 24.0, 18.0, 19.0, 16.0, 8.0, 11.0, 12.0, 8.0, 4.0, 0.0, 7.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-17.362857818603516, -16.822925567626953, -16.28299331665039, -15.743061065673828, -15.203128814697266, -14.663196563720703, -14.123263359069824, -13.583331108093262, -13.0433988571167, -12.503466606140137, -11.963534355163574, -11.423602104187012, -10.883668899536133, -10.34373664855957, -9.803804397583008, -9.263872146606445, -8.723939895629883, -8.18400764465332, -7.644075393676758, -7.104142665863037, -6.564210414886475, -6.024278163909912, -5.484345436096191, -4.944413185119629, -4.404480934143066, -3.864548683166504, -3.3246161937713623, -2.7846837043762207, -2.244751453399658, -1.7048192024230957, -1.164886713027954, -0.6249542236328125, -0.08502388000488281, 0.45490849018096924, 0.9948408603668213, 1.5347732305526733, 2.0747056007385254, 2.614637851715088, 3.1545703411102295, 3.694502830505371, 4.234435081481934, 4.774367332458496, 5.314299583435059, 5.854232311248779, 6.394164562225342, 6.934096813201904, 7.474029541015625, 8.013961791992188, 8.55389404296875, 9.093826293945312, 9.633758544921875, 10.173690795898438, 10.713623046875, 11.253555297851562, 11.793488502502441, 12.333420753479004, 12.873353004455566, 13.413285255432129, 13.953217506408691, 14.493149757385254, 15.033082962036133, 15.573015213012695, 16.112947463989258, 16.65287971496582, 17.192811965942383]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 5.0, 5.0, 5.0, 4.0, 10.0, 21.0, 24.0, 24.0, 38.0, 59.0, 61.0, 122.0, 138.0, 220.0, 327.0, 472.0, 681.0, 979.0, 1429.0, 2146.0, 3296.0, 4994.0, 8002.0, 12576.0, 20691.0, 35469.0, 61620.0, 109259.0, 184843.0, 224121.0, 157446.0, 90629.0, 51097.0, 29498.0, 17738.0, 10690.0, 6715.0, 4404.0, 2742.0, 1889.0, 1290.0, 839.0, 586.0, 403.0, 287.0, 198.0, 150.0, 102.0, 64.0, 52.0, 34.0, 19.0, 16.0, 8.0, 8.0, 13.0, 4.0, 1.0, 2.0, 4.0, 2.0], "bins": [-1.373046875, -1.3305816650390625, -1.288116455078125, -1.2456512451171875, -1.20318603515625, -1.1607208251953125, -1.118255615234375, -1.0757904052734375, -1.0333251953125, -0.9908599853515625, -0.948394775390625, -0.9059295654296875, -0.86346435546875, -0.8209991455078125, -0.778533935546875, -0.7360687255859375, -0.693603515625, -0.6511383056640625, -0.608673095703125, -0.5662078857421875, -0.52374267578125, -0.4812774658203125, -0.438812255859375, -0.3963470458984375, -0.3538818359375, -0.3114166259765625, -0.268951416015625, -0.2264862060546875, -0.18402099609375, -0.1415557861328125, -0.099090576171875, -0.0566253662109375, -0.01416015625, 0.0283050537109375, 0.070770263671875, 0.1132354736328125, 0.15570068359375, 0.1981658935546875, 0.240631103515625, 0.2830963134765625, 0.3255615234375, 0.3680267333984375, 0.410491943359375, 0.4529571533203125, 0.49542236328125, 0.5378875732421875, 0.580352783203125, 0.6228179931640625, 0.665283203125, 0.7077484130859375, 0.750213623046875, 0.7926788330078125, 0.83514404296875, 0.8776092529296875, 0.920074462890625, 0.9625396728515625, 1.0050048828125, 1.0474700927734375, 1.089935302734375, 1.1324005126953125, 1.17486572265625, 1.2173309326171875, 1.259796142578125, 1.3022613525390625, 1.3447265625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 0.0, 4.0, 3.0, 3.0, 8.0, 8.0, 7.0, 10.0, 17.0, 24.0, 27.0, 16.0, 29.0, 32.0, 29.0, 31.0, 46.0, 41.0, 44.0, 40.0, 49.0, 55.0, 48.0, 50.0, 44.0, 45.0, 54.0, 34.0, 34.0, 31.0, 27.0, 16.0, 19.0, 15.0, 11.0, 12.0, 12.0, 7.0, 5.0, 9.0, 2.0, 4.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6533203125, -1.6055145263671875, -1.557708740234375, -1.5099029541015625, -1.46209716796875, -1.4142913818359375, -1.366485595703125, -1.3186798095703125, -1.2708740234375, -1.2230682373046875, -1.175262451171875, -1.1274566650390625, -1.07965087890625, -1.0318450927734375, -0.984039306640625, -0.9362335205078125, -0.888427734375, -0.8406219482421875, -0.792816162109375, -0.7450103759765625, -0.69720458984375, -0.6493988037109375, -0.601593017578125, -0.5537872314453125, -0.5059814453125, -0.4581756591796875, -0.410369873046875, -0.3625640869140625, -0.31475830078125, -0.2669525146484375, -0.219146728515625, -0.1713409423828125, -0.12353515625, -0.0757293701171875, -0.027923583984375, 0.0198822021484375, 0.06768798828125, 0.1154937744140625, 0.163299560546875, 0.2111053466796875, 0.2589111328125, 0.3067169189453125, 0.354522705078125, 0.4023284912109375, 0.45013427734375, 0.4979400634765625, 0.545745849609375, 0.5935516357421875, 0.641357421875, 0.6891632080078125, 0.736968994140625, 0.7847747802734375, 0.83258056640625, 0.8803863525390625, 0.928192138671875, 0.9759979248046875, 1.0238037109375, 1.0716094970703125, 1.119415283203125, 1.1672210693359375, 1.21502685546875, 1.2628326416015625, 1.310638427734375, 1.3584442138671875, 1.40625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 4.0, 6.0, 4.0, 7.0, 11.0, 17.0, 23.0, 42.0, 74.0, 118.0, 177.0, 267.0, 458.0, 955.0, 2493.0, 13356.0, 331991.0, 677685.0, 15880.0, 2765.0, 1006.0, 449.0, 306.0, 158.0, 105.0, 75.0, 42.0, 28.0, 22.0, 12.0, 5.0, 9.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.7421875, -6.4927978515625, -6.243408203125, -5.9940185546875, -5.74462890625, -5.4952392578125, -5.245849609375, -4.9964599609375, -4.7470703125, -4.4976806640625, -4.248291015625, -3.9989013671875, -3.74951171875, -3.5001220703125, -3.250732421875, -3.0013427734375, -2.751953125, -2.5025634765625, -2.253173828125, -2.0037841796875, -1.75439453125, -1.5050048828125, -1.255615234375, -1.0062255859375, -0.7568359375, -0.5074462890625, -0.258056640625, -0.0086669921875, 0.24072265625, 0.4901123046875, 0.739501953125, 0.9888916015625, 1.23828125, 1.4876708984375, 1.737060546875, 1.9864501953125, 2.23583984375, 2.4852294921875, 2.734619140625, 2.9840087890625, 3.2333984375, 3.4827880859375, 3.732177734375, 3.9815673828125, 4.23095703125, 4.4803466796875, 4.729736328125, 4.9791259765625, 5.228515625, 5.4779052734375, 5.727294921875, 5.9766845703125, 6.22607421875, 6.4754638671875, 6.724853515625, 6.9742431640625, 7.2236328125, 7.4730224609375, 7.722412109375, 7.9718017578125, 8.22119140625, 8.4705810546875, 8.719970703125, 8.9693603515625, 9.21875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 10.0, 4.0, 7.0, 6.0, 9.0, 16.0, 10.0, 15.0, 22.0, 24.0, 29.0, 21.0, 49.0, 35.0, 39.0, 52.0, 61.0, 74.0, 72.0, 61.0, 50.0, 53.0, 48.0, 44.0, 42.0, 26.0, 21.0, 20.0, 16.0, 16.0, 14.0, 5.0, 8.0, 9.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-8.0625, -7.85089111328125, -7.6392822265625, -7.42767333984375, -7.216064453125, -7.00445556640625, -6.7928466796875, -6.58123779296875, -6.36962890625, -6.15802001953125, -5.9464111328125, -5.73480224609375, -5.523193359375, -5.31158447265625, -5.0999755859375, -4.88836669921875, -4.6767578125, -4.46514892578125, -4.2535400390625, -4.04193115234375, -3.830322265625, -3.61871337890625, -3.4071044921875, -3.19549560546875, -2.98388671875, -2.77227783203125, -2.5606689453125, -2.34906005859375, -2.137451171875, -1.92584228515625, -1.7142333984375, -1.50262451171875, -1.291015625, -1.07940673828125, -0.8677978515625, -0.65618896484375, -0.444580078125, -0.23297119140625, -0.0213623046875, 0.19024658203125, 0.40185546875, 0.61346435546875, 0.8250732421875, 1.03668212890625, 1.248291015625, 1.45989990234375, 1.6715087890625, 1.88311767578125, 2.0947265625, 2.30633544921875, 2.5179443359375, 2.72955322265625, 2.941162109375, 3.15277099609375, 3.3643798828125, 3.57598876953125, 3.78759765625, 3.99920654296875, 4.2108154296875, 4.42242431640625, 4.634033203125, 4.84564208984375, 5.0572509765625, 5.26885986328125, 5.48046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 1.0, 2.0, 5.0, 6.0, 9.0, 10.0, 11.0, 15.0, 34.0, 58.0, 115.0, 226.0, 637.0, 2135.0, 11358.0, 184979.0, 819045.0, 24804.0, 3499.0, 938.0, 311.0, 156.0, 84.0, 33.0, 26.0, 18.0, 9.0, 3.0, 7.0, 3.0, 2.0, 2.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.314453125, -2.240203857421875, -2.16595458984375, -2.091705322265625, -2.0174560546875, -1.943206787109375, -1.86895751953125, -1.794708251953125, -1.720458984375, -1.646209716796875, -1.57196044921875, -1.497711181640625, -1.4234619140625, -1.349212646484375, -1.27496337890625, -1.200714111328125, -1.12646484375, -1.052215576171875, -0.97796630859375, -0.903717041015625, -0.8294677734375, -0.755218505859375, -0.68096923828125, -0.606719970703125, -0.532470703125, -0.458221435546875, -0.38397216796875, -0.309722900390625, -0.2354736328125, -0.161224365234375, -0.08697509765625, -0.012725830078125, 0.0615234375, 0.135772705078125, 0.21002197265625, 0.284271240234375, 0.3585205078125, 0.432769775390625, 0.50701904296875, 0.581268310546875, 0.655517578125, 0.729766845703125, 0.80401611328125, 0.878265380859375, 0.9525146484375, 1.026763916015625, 1.10101318359375, 1.175262451171875, 1.24951171875, 1.323760986328125, 1.39801025390625, 1.472259521484375, 1.5465087890625, 1.620758056640625, 1.69500732421875, 1.769256591796875, 1.843505859375, 1.917755126953125, 1.99200439453125, 2.066253662109375, 2.1405029296875, 2.214752197265625, 2.28900146484375, 2.363250732421875, 2.4375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 4.0, 8.0, 20.0, 19.0, 22.0, 45.0, 40.0, 83.0, 116.0, 161.0, 127.0, 100.0, 61.0, 52.0, 35.0, 21.0, 17.0, 15.0, 11.0, 8.0, 4.0, 1.0, 3.0, 3.0, 5.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007634162902832031, -0.0007437393069267273, -0.0007240623235702515, -0.0007043853402137756, -0.0006847083568572998, -0.000665031373500824, -0.0006453543901443481, -0.0006256774067878723, -0.0006060004234313965, -0.0005863234400749207, -0.0005666464567184448, -0.000546969473361969, -0.0005272924900054932, -0.0005076155066490173, -0.0004879385232925415, -0.0004682615399360657, -0.00044858455657958984, -0.000428907573223114, -0.0004092305898666382, -0.00038955360651016235, -0.0003698766231536865, -0.0003501996397972107, -0.00033052265644073486, -0.00031084567308425903, -0.0002911686897277832, -0.0002714917063713074, -0.00025181472301483154, -0.0002321377396583557, -0.00021246075630187988, -0.00019278377294540405, -0.00017310678958892822, -0.0001534298062324524, -0.00013375282287597656, -0.00011407583951950073, -9.43988561630249e-05, -7.472187280654907e-05, -5.504488945007324e-05, -3.536790609359741e-05, -1.5690922737121582e-05, 3.986060619354248e-06, 2.3663043975830078e-05, 4.334002733230591e-05, 6.301701068878174e-05, 8.269399404525757e-05, 0.0001023709774017334, 0.00012204796075820923, 0.00014172494411468506, 0.0001614019274711609, 0.00018107891082763672, 0.00020075589418411255, 0.00022043287754058838, 0.0002401098608970642, 0.00025978684425354004, 0.00027946382761001587, 0.0002991408109664917, 0.00031881779432296753, 0.00033849477767944336, 0.0003581717610359192, 0.000377848744392395, 0.00039752572774887085, 0.0004172027111053467, 0.0004368796944618225, 0.00045655667781829834, 0.00047623366117477417, 0.00049591064453125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 5.0, 10.0, 13.0, 16.0, 25.0, 61.0, 113.0, 306.0, 791.0, 2752.0, 19362.0, 896901.0, 119223.0, 6667.0, 1435.0, 495.0, 183.0, 87.0, 42.0, 21.0, 10.0, 9.0, 10.0, 6.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.6796875, -2.595306396484375, -2.51092529296875, -2.426544189453125, -2.3421630859375, -2.257781982421875, -2.17340087890625, -2.089019775390625, -2.004638671875, -1.920257568359375, -1.83587646484375, -1.751495361328125, -1.6671142578125, -1.582733154296875, -1.49835205078125, -1.413970947265625, -1.32958984375, -1.245208740234375, -1.16082763671875, -1.076446533203125, -0.9920654296875, -0.907684326171875, -0.82330322265625, -0.738922119140625, -0.654541015625, -0.570159912109375, -0.48577880859375, -0.401397705078125, -0.3170166015625, -0.232635498046875, -0.14825439453125, -0.063873291015625, 0.0205078125, 0.104888916015625, 0.18927001953125, 0.273651123046875, 0.3580322265625, 0.442413330078125, 0.52679443359375, 0.611175537109375, 0.695556640625, 0.779937744140625, 0.86431884765625, 0.948699951171875, 1.0330810546875, 1.117462158203125, 1.20184326171875, 1.286224365234375, 1.37060546875, 1.454986572265625, 1.53936767578125, 1.623748779296875, 1.7081298828125, 1.792510986328125, 1.87689208984375, 1.961273193359375, 2.045654296875, 2.130035400390625, 2.21441650390625, 2.298797607421875, 2.3831787109375, 2.467559814453125, 2.55194091796875, 2.636322021484375, 2.720703125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 10.0, 19.0, 16.0, 24.0, 38.0, 38.0, 58.0, 65.0, 80.0, 109.0, 115.0, 89.0, 70.0, 67.0, 58.0, 46.0, 38.0, 15.0, 14.0, 11.0, 9.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0546875, -1.0093536376953125, -0.964019775390625, -0.9186859130859375, -0.87335205078125, -0.8280181884765625, -0.782684326171875, -0.7373504638671875, -0.6920166015625, -0.6466827392578125, -0.601348876953125, -0.5560150146484375, -0.51068115234375, -0.4653472900390625, -0.420013427734375, -0.3746795654296875, -0.329345703125, -0.2840118408203125, -0.238677978515625, -0.1933441162109375, -0.14801025390625, -0.1026763916015625, -0.057342529296875, -0.0120086669921875, 0.0333251953125, 0.0786590576171875, 0.123992919921875, 0.1693267822265625, 0.21466064453125, 0.2599945068359375, 0.305328369140625, 0.3506622314453125, 0.39599609375, 0.4413299560546875, 0.486663818359375, 0.5319976806640625, 0.57733154296875, 0.6226654052734375, 0.667999267578125, 0.7133331298828125, 0.7586669921875, 0.8040008544921875, 0.849334716796875, 0.8946685791015625, 0.94000244140625, 0.9853363037109375, 1.030670166015625, 1.0760040283203125, 1.121337890625, 1.1666717529296875, 1.212005615234375, 1.2573394775390625, 1.30267333984375, 1.3480072021484375, 1.393341064453125, 1.4386749267578125, 1.4840087890625, 1.5293426513671875, 1.574676513671875, 1.6200103759765625, 1.66534423828125, 1.7106781005859375, 1.756011962890625, 1.8013458251953125, 1.8466796875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 14.0, 53.0, 147.0, 540.0, 168.0, 49.0, 16.0, 12.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.17497253417969, -50.9249267578125, -48.67487716674805, -46.424827575683594, -44.174781799316406, -41.92473602294922, -39.674686431884766, -37.42463684082031, -35.174591064453125, -32.92454528808594, -30.674495697021484, -28.424448013305664, -26.174400329589844, -23.924352645874023, -21.674304962158203, -19.424257278442383, -17.174209594726562, -14.924161911010742, -12.674114227294922, -10.424066543579102, -8.174018859863281, -5.923971176147461, -3.6739234924316406, -1.4238758087158203, 0.826171875, 3.0762195587158203, 5.326267242431641, 7.576314926147461, 9.826362609863281, 12.076410293579102, 14.326457977294922, 16.576505661010742, 18.82654571533203, 21.07659339904785, 23.326641082763672, 25.576688766479492, 27.826736450195312, 30.076784133911133, 32.32683181762695, 34.576881408691406, 36.826927185058594, 39.07697296142578, 41.327022552490234, 43.57707214355469, 45.827117919921875, 48.07716369628906, 50.327213287353516, 52.57726287841797, 54.827308654785156, 57.077354431152344, 59.3274040222168, 61.57745361328125, 63.82749938964844, 66.07754516601562, 68.32759094238281, 70.57764434814453, 72.82769012451172, 75.0777359008789, 77.32778930664062, 79.57783508300781, 81.827880859375, 84.07792663574219, 86.32797241210938, 88.5780258178711, 90.82807159423828]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 1.0, 4.0, 5.0, 7.0, 7.0, 3.0, 9.0, 12.0, 12.0, 12.0, 18.0, 19.0, 25.0, 27.0, 32.0, 30.0, 47.0, 49.0, 62.0, 166.0, 130.0, 54.0, 35.0, 26.0, 24.0, 27.0, 33.0, 23.0, 23.0, 11.0, 10.0, 9.0, 8.0, 7.0, 9.0, 4.0, 8.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.737560272216797, -24.816335678100586, -23.895112991333008, -22.973888397216797, -22.05266571044922, -21.131441116333008, -20.210216522216797, -19.28899383544922, -18.36777114868164, -17.44654655456543, -16.52532386779785, -15.60409927368164, -14.682876586914062, -13.761651992797852, -12.840428352355957, -11.919204711914062, -10.997980117797852, -10.076756477355957, -9.155532836914062, -8.234308242797852, -7.313085079193115, -6.391861438751221, -5.470637321472168, -4.549413681030273, -3.628190040588379, -2.7069664001464844, -1.7857425212860107, -0.8645186424255371, 0.05670499801635742, 0.977928638458252, 1.8991527557373047, 2.820376396179199, 3.7416000366210938, 4.662823677062988, 5.584047317504883, 6.5052714347839355, 7.42649507522583, 8.347719192504883, 9.268942832946777, 10.190166473388672, 11.111390113830566, 12.032613754272461, 12.953837394714355, 13.87506103515625, 14.796285629272461, 15.717508316040039, 16.63873291015625, 17.559955596923828, 18.48118019104004, 19.40240478515625, 20.323627471923828, 21.24485206604004, 22.166074752807617, 23.087299346923828, 24.008522033691406, 24.929746627807617, 25.850971221923828, 26.77219581604004, 27.693418502807617, 28.614643096923828, 29.535865783691406, 30.457090377807617, 31.378314971923828, 32.299537658691406, 33.220760345458984]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 6.0, 3.0, 8.0, 5.0, 8.0, 9.0, 22.0, 29.0, 34.0, 51.0, 72.0, 118.0, 145.0, 252.0, 331.0, 529.0, 758.0, 1205.0, 1883.0, 3344.0, 6463.0, 14014.0, 36382.0, 113533.0, 381158.0, 1078407.0, 1504190.0, 711489.0, 225960.0, 67973.0, 23736.0, 10175.0, 4996.0, 2629.0, 1533.0, 978.0, 587.0, 401.0, 299.0, 174.0, 148.0, 86.0, 58.0, 35.0, 31.0, 15.0, 12.0, 9.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0], "bins": [-1.7880859375, -1.738800048828125, -1.68951416015625, -1.640228271484375, -1.5909423828125, -1.541656494140625, -1.49237060546875, -1.443084716796875, -1.393798828125, -1.344512939453125, -1.29522705078125, -1.245941162109375, -1.1966552734375, -1.147369384765625, -1.09808349609375, -1.048797607421875, -0.99951171875, -0.950225830078125, -0.90093994140625, -0.851654052734375, -0.8023681640625, -0.753082275390625, -0.70379638671875, -0.654510498046875, -0.605224609375, -0.555938720703125, -0.50665283203125, -0.457366943359375, -0.4080810546875, -0.358795166015625, -0.30950927734375, -0.260223388671875, -0.2109375, -0.161651611328125, -0.11236572265625, -0.063079833984375, -0.0137939453125, 0.035491943359375, 0.08477783203125, 0.134063720703125, 0.183349609375, 0.232635498046875, 0.28192138671875, 0.331207275390625, 0.3804931640625, 0.429779052734375, 0.47906494140625, 0.528350830078125, 0.57763671875, 0.626922607421875, 0.67620849609375, 0.725494384765625, 0.7747802734375, 0.824066162109375, 0.87335205078125, 0.922637939453125, 0.971923828125, 1.021209716796875, 1.07049560546875, 1.119781494140625, 1.1690673828125, 1.218353271484375, 1.26763916015625, 1.316925048828125, 1.3662109375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 3.0, 1.0, 6.0, 4.0, 14.0, 12.0, 13.0, 20.0, 20.0, 25.0, 39.0, 32.0, 34.0, 53.0, 49.0, 69.0, 57.0, 51.0, 63.0, 67.0, 50.0, 52.0, 47.0, 43.0, 41.0, 35.0, 28.0, 15.0, 12.0, 12.0, 18.0, 6.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.904296875, -1.8480224609375, -1.791748046875, -1.7354736328125, -1.67919921875, -1.6229248046875, -1.566650390625, -1.5103759765625, -1.4541015625, -1.3978271484375, -1.341552734375, -1.2852783203125, -1.22900390625, -1.1727294921875, -1.116455078125, -1.0601806640625, -1.00390625, -0.9476318359375, -0.891357421875, -0.8350830078125, -0.77880859375, -0.7225341796875, -0.666259765625, -0.6099853515625, -0.5537109375, -0.4974365234375, -0.441162109375, -0.3848876953125, -0.32861328125, -0.2723388671875, -0.216064453125, -0.1597900390625, -0.103515625, -0.0472412109375, 0.009033203125, 0.0653076171875, 0.12158203125, 0.1778564453125, 0.234130859375, 0.2904052734375, 0.3466796875, 0.4029541015625, 0.459228515625, 0.5155029296875, 0.57177734375, 0.6280517578125, 0.684326171875, 0.7406005859375, 0.796875, 0.8531494140625, 0.909423828125, 0.9656982421875, 1.02197265625, 1.0782470703125, 1.134521484375, 1.1907958984375, 1.2470703125, 1.3033447265625, 1.359619140625, 1.4158935546875, 1.47216796875, 1.5284423828125, 1.584716796875, 1.6409912109375, 1.697265625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 10.0, 14.0, 41.0, 79.0, 135.0, 297.0, 671.0, 1878.0, 12823.0, 4052924.0, 120110.0, 3525.0, 947.0, 421.0, 201.0, 91.0, 54.0, 25.0, 14.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.96875, -15.5218505859375, -15.074951171875, -14.6280517578125, -14.18115234375, -13.7342529296875, -13.287353515625, -12.8404541015625, -12.3935546875, -11.9466552734375, -11.499755859375, -11.0528564453125, -10.60595703125, -10.1590576171875, -9.712158203125, -9.2652587890625, -8.818359375, -8.3714599609375, -7.924560546875, -7.4776611328125, -7.03076171875, -6.5838623046875, -6.136962890625, -5.6900634765625, -5.2431640625, -4.7962646484375, -4.349365234375, -3.9024658203125, -3.45556640625, -3.0086669921875, -2.561767578125, -2.1148681640625, -1.66796875, -1.2210693359375, -0.774169921875, -0.3272705078125, 0.11962890625, 0.5665283203125, 1.013427734375, 1.4603271484375, 1.9072265625, 2.3541259765625, 2.801025390625, 3.2479248046875, 3.69482421875, 4.1417236328125, 4.588623046875, 5.0355224609375, 5.482421875, 5.9293212890625, 6.376220703125, 6.8231201171875, 7.27001953125, 7.7169189453125, 8.163818359375, 8.6107177734375, 9.0576171875, 9.5045166015625, 9.951416015625, 10.3983154296875, 10.84521484375, 11.2921142578125, 11.739013671875, 12.1859130859375, 12.6328125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 8.0, 12.0, 10.0, 33.0, 43.0, 94.0, 151.0, 270.0, 490.0, 845.0, 870.0, 563.0, 318.0, 168.0, 96.0, 50.0, 24.0, 15.0, 11.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.0, -9.76263427734375, -9.5252685546875, -9.28790283203125, -9.050537109375, -8.81317138671875, -8.5758056640625, -8.33843994140625, -8.10107421875, -7.86370849609375, -7.6263427734375, -7.38897705078125, -7.151611328125, -6.91424560546875, -6.6768798828125, -6.43951416015625, -6.2021484375, -5.96478271484375, -5.7274169921875, -5.49005126953125, -5.252685546875, -5.01531982421875, -4.7779541015625, -4.54058837890625, -4.30322265625, -4.06585693359375, -3.8284912109375, -3.59112548828125, -3.353759765625, -3.11639404296875, -2.8790283203125, -2.64166259765625, -2.404296875, -2.16693115234375, -1.9295654296875, -1.69219970703125, -1.454833984375, -1.21746826171875, -0.9801025390625, -0.74273681640625, -0.50537109375, -0.26800537109375, -0.0306396484375, 0.20672607421875, 0.444091796875, 0.68145751953125, 0.9188232421875, 1.15618896484375, 1.3935546875, 1.63092041015625, 1.8682861328125, 2.10565185546875, 2.343017578125, 2.58038330078125, 2.8177490234375, 3.05511474609375, 3.29248046875, 3.52984619140625, 3.7672119140625, 4.00457763671875, 4.241943359375, 4.47930908203125, 4.7166748046875, 4.95404052734375, 5.19140625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 7.0, 12.0, 18.0, 34.0, 57.0, 142.0, 226.0, 209.0, 130.0, 76.0, 36.0, 19.0, 7.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.31403732299805, -46.12442398071289, -43.93480682373047, -41.74519348144531, -39.555580139160156, -37.365966796875, -35.176353454589844, -32.98673629760742, -30.797122955322266, -28.60750961303711, -26.41789436340332, -24.22827911376953, -22.038665771484375, -19.84905242919922, -17.65943717956543, -15.469822883605957, -13.280208587646484, -11.090594291687012, -8.900979995727539, -6.711365699768066, -4.521751403808594, -2.332137107849121, -0.14252281188964844, 2.047091484069824, 4.236705780029297, 6.4263200759887695, 8.615934371948242, 10.805548667907715, 12.995162963867188, 15.18477725982666, 17.374391555786133, 19.564006805419922, 21.753616333007812, 23.94322967529297, 26.132844924926758, 28.322460174560547, 30.512073516845703, 32.70168685913086, 34.89130401611328, 37.08091735839844, 39.270530700683594, 41.46014404296875, 43.649757385253906, 45.83937454223633, 48.028987884521484, 50.21860122680664, 52.40821838378906, 54.59783172607422, 56.787445068359375, 58.97705841064453, 61.16667175292969, 63.35628890991211, 65.5458984375, 67.73551940917969, 69.92513275146484, 72.11474609375, 74.30435943603516, 76.49397277832031, 78.68358612060547, 80.87319946289062, 83.06282043457031, 85.25243377685547, 87.44204711914062, 89.63166046142578, 91.82127380371094]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 7.0, 4.0, 12.0, 4.0, 7.0, 5.0, 16.0, 15.0, 21.0, 16.0, 26.0, 31.0, 30.0, 34.0, 42.0, 25.0, 50.0, 42.0, 63.0, 60.0, 73.0, 58.0, 57.0, 34.0, 39.0, 38.0, 25.0, 34.0, 27.0, 28.0, 12.0, 13.0, 16.0, 11.0, 11.0, 3.0, 7.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.599754333496094, -29.7222843170166, -28.84481430053711, -27.967344284057617, -27.089874267578125, -26.212404251098633, -25.33493423461914, -24.457462310791016, -23.579994201660156, -22.702524185180664, -21.825054168701172, -20.94758415222168, -20.070114135742188, -19.192644119262695, -18.315174102783203, -17.437702178955078, -16.560232162475586, -15.682762145996094, -14.805292129516602, -13.92782211303711, -13.050352096557617, -12.172882080078125, -11.295411109924316, -10.417941093444824, -9.540471076965332, -8.66300106048584, -7.785531044006348, -6.908060550689697, -6.030590534210205, -5.153120517730713, -4.2756500244140625, -3.3981800079345703, -2.520709991455078, -1.6432398557662964, -0.7657697200775146, 0.11170053482055664, 0.9891705513000488, 1.866640567779541, 2.7441110610961914, 3.6215810775756836, 4.499051094055176, 5.376521110534668, 6.25399112701416, 7.1314616203308105, 8.008932113647461, 8.886402130126953, 9.763872146606445, 10.641342163085938, 11.51881217956543, 12.396282196044922, 13.273752212524414, 14.151222229003906, 15.028692245483398, 15.90616226196289, 16.783634185791016, 17.661102294921875, 18.53857421875, 19.416044235229492, 20.293514251708984, 21.170984268188477, 22.04845428466797, 22.92592430114746, 23.803394317626953, 24.680866241455078, 25.558334350585938]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 8.0, 10.0, 10.0, 17.0, 11.0, 37.0, 29.0, 77.0, 120.0, 170.0, 323.0, 538.0, 875.0, 1702.0, 3602.0, 7877.0, 21013.0, 64934.0, 308108.0, 501410.0, 91578.0, 26940.0, 10131.0, 4304.0, 2109.0, 1138.0, 639.0, 323.0, 187.0, 114.0, 81.0, 52.0, 37.0, 9.0, 11.0, 13.0, 8.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.765625, -2.673828125, -2.58203125, -2.490234375, -2.3984375, -2.306640625, -2.21484375, -2.123046875, -2.03125, -1.939453125, -1.84765625, -1.755859375, -1.6640625, -1.572265625, -1.48046875, -1.388671875, -1.296875, -1.205078125, -1.11328125, -1.021484375, -0.9296875, -0.837890625, -0.74609375, -0.654296875, -0.5625, -0.470703125, -0.37890625, -0.287109375, -0.1953125, -0.103515625, -0.01171875, 0.080078125, 0.171875, 0.263671875, 0.35546875, 0.447265625, 0.5390625, 0.630859375, 0.72265625, 0.814453125, 0.90625, 0.998046875, 1.08984375, 1.181640625, 1.2734375, 1.365234375, 1.45703125, 1.548828125, 1.640625, 1.732421875, 1.82421875, 1.916015625, 2.0078125, 2.099609375, 2.19140625, 2.283203125, 2.375, 2.466796875, 2.55859375, 2.650390625, 2.7421875, 2.833984375, 2.92578125, 3.017578125, 3.109375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 4.0, 6.0, 10.0, 10.0, 13.0, 25.0, 20.0, 16.0, 31.0, 29.0, 34.0, 34.0, 44.0, 46.0, 56.0, 52.0, 57.0, 60.0, 68.0, 56.0, 49.0, 50.0, 32.0, 40.0, 26.0, 28.0, 27.0, 22.0, 18.0, 12.0, 9.0, 8.0, 8.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.1796875, -2.1172637939453125, -2.054840087890625, -1.9924163818359375, -1.92999267578125, -1.8675689697265625, -1.805145263671875, -1.7427215576171875, -1.6802978515625, -1.6178741455078125, -1.555450439453125, -1.4930267333984375, -1.43060302734375, -1.3681793212890625, -1.305755615234375, -1.2433319091796875, -1.180908203125, -1.1184844970703125, -1.056060791015625, -0.9936370849609375, -0.93121337890625, -0.8687896728515625, -0.806365966796875, -0.7439422607421875, -0.6815185546875, -0.6190948486328125, -0.556671142578125, -0.4942474365234375, -0.43182373046875, -0.3694000244140625, -0.306976318359375, -0.2445526123046875, -0.18212890625, -0.1197052001953125, -0.057281494140625, 0.0051422119140625, 0.06756591796875, 0.1299896240234375, 0.192413330078125, 0.2548370361328125, 0.3172607421875, 0.3796844482421875, 0.442108154296875, 0.5045318603515625, 0.56695556640625, 0.6293792724609375, 0.691802978515625, 0.7542266845703125, 0.816650390625, 0.8790740966796875, 0.941497802734375, 1.0039215087890625, 1.06634521484375, 1.1287689208984375, 1.191192626953125, 1.2536163330078125, 1.3160400390625, 1.3784637451171875, 1.440887451171875, 1.5033111572265625, 1.56573486328125, 1.6281585693359375, 1.690582275390625, 1.7530059814453125, 1.8154296875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 13.0, 5.0, 15.0, 9.0, 24.0, 13.0, 27.0, 41.0, 63.0, 69.0, 162.0, 210.0, 353.0, 703.0, 1527.0, 4516.0, 22189.0, 254254.0, 730567.0, 25095.0, 5144.0, 1738.0, 733.0, 361.0, 241.0, 141.0, 92.0, 69.0, 36.0, 35.0, 17.0, 15.0, 16.0, 11.0, 5.0, 12.0, 7.0, 3.0, 4.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-4.86328125, -4.716064453125, -4.56884765625, -4.421630859375, -4.2744140625, -4.127197265625, -3.97998046875, -3.832763671875, -3.685546875, -3.538330078125, -3.39111328125, -3.243896484375, -3.0966796875, -2.949462890625, -2.80224609375, -2.655029296875, -2.5078125, -2.360595703125, -2.21337890625, -2.066162109375, -1.9189453125, -1.771728515625, -1.62451171875, -1.477294921875, -1.330078125, -1.182861328125, -1.03564453125, -0.888427734375, -0.7412109375, -0.593994140625, -0.44677734375, -0.299560546875, -0.15234375, -0.005126953125, 0.14208984375, 0.289306640625, 0.4365234375, 0.583740234375, 0.73095703125, 0.878173828125, 1.025390625, 1.172607421875, 1.31982421875, 1.467041015625, 1.6142578125, 1.761474609375, 1.90869140625, 2.055908203125, 2.203125, 2.350341796875, 2.49755859375, 2.644775390625, 2.7919921875, 2.939208984375, 3.08642578125, 3.233642578125, 3.380859375, 3.528076171875, 3.67529296875, 3.822509765625, 3.9697265625, 4.116943359375, 4.26416015625, 4.411376953125, 4.55859375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 7.0, 4.0, 11.0, 9.0, 15.0, 20.0, 17.0, 14.0, 17.0, 15.0, 31.0, 27.0, 28.0, 29.0, 52.0, 58.0, 63.0, 62.0, 69.0, 61.0, 57.0, 49.0, 50.0, 32.0, 41.0, 26.0, 17.0, 15.0, 15.0, 14.0, 13.0, 14.0, 11.0, 9.0, 4.0, 5.0, 5.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.8515625, -6.622802734375, -6.39404296875, -6.165283203125, -5.9365234375, -5.707763671875, -5.47900390625, -5.250244140625, -5.021484375, -4.792724609375, -4.56396484375, -4.335205078125, -4.1064453125, -3.877685546875, -3.64892578125, -3.420166015625, -3.19140625, -2.962646484375, -2.73388671875, -2.505126953125, -2.2763671875, -2.047607421875, -1.81884765625, -1.590087890625, -1.361328125, -1.132568359375, -0.90380859375, -0.675048828125, -0.4462890625, -0.217529296875, 0.01123046875, 0.239990234375, 0.46875, 0.697509765625, 0.92626953125, 1.155029296875, 1.3837890625, 1.612548828125, 1.84130859375, 2.070068359375, 2.298828125, 2.527587890625, 2.75634765625, 2.985107421875, 3.2138671875, 3.442626953125, 3.67138671875, 3.900146484375, 4.12890625, 4.357666015625, 4.58642578125, 4.815185546875, 5.0439453125, 5.272705078125, 5.50146484375, 5.730224609375, 5.958984375, 6.187744140625, 6.41650390625, 6.645263671875, 6.8740234375, 7.102783203125, 7.33154296875, 7.560302734375, 7.7890625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 9.0, 2.0, 9.0, 10.0, 16.0, 27.0, 42.0, 51.0, 96.0, 128.0, 233.0, 419.0, 801.0, 2046.0, 6204.0, 28085.0, 794364.0, 187914.0, 19982.0, 4792.0, 1698.0, 734.0, 350.0, 195.0, 106.0, 65.0, 44.0, 42.0, 23.0, 16.0, 12.0, 6.0, 4.0, 5.0, 3.0, 5.0, 4.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.06640625, -1.0329742431640625, -0.999542236328125, -0.9661102294921875, -0.93267822265625, -0.8992462158203125, -0.865814208984375, -0.8323822021484375, -0.7989501953125, -0.7655181884765625, -0.732086181640625, -0.6986541748046875, -0.66522216796875, -0.6317901611328125, -0.598358154296875, -0.5649261474609375, -0.531494140625, -0.4980621337890625, -0.464630126953125, -0.4311981201171875, -0.39776611328125, -0.3643341064453125, -0.330902099609375, -0.2974700927734375, -0.2640380859375, -0.2306060791015625, -0.197174072265625, -0.1637420654296875, -0.13031005859375, -0.0968780517578125, -0.063446044921875, -0.0300140380859375, 0.00341796875, 0.0368499755859375, 0.070281982421875, 0.1037139892578125, 0.13714599609375, 0.1705780029296875, 0.204010009765625, 0.2374420166015625, 0.2708740234375, 0.3043060302734375, 0.337738037109375, 0.3711700439453125, 0.40460205078125, 0.4380340576171875, 0.471466064453125, 0.5048980712890625, 0.538330078125, 0.5717620849609375, 0.605194091796875, 0.6386260986328125, 0.67205810546875, 0.7054901123046875, 0.738922119140625, 0.7723541259765625, 0.8057861328125, 0.8392181396484375, 0.872650146484375, 0.9060821533203125, 0.93951416015625, 0.9729461669921875, 1.006378173828125, 1.0398101806640625, 1.0732421875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 14.0, 6.0, 6.0, 16.0, 19.0, 27.0, 28.0, 30.0, 44.0, 61.0, 118.0, 163.0, 136.0, 95.0, 51.0, 34.0, 26.0, 19.0, 18.0, 16.0, 11.0, 7.0, 7.0, 4.0, 6.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 8.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004456043243408203, -0.000431109219789505, -0.0004166141152381897, -0.0004021190106868744, -0.0003876239061355591, -0.0003731288015842438, -0.00035863369703292847, -0.00034413859248161316, -0.00032964348793029785, -0.00031514838337898254, -0.00030065327882766724, -0.00028615817427635193, -0.0002716630697250366, -0.0002571679651737213, -0.000242672860622406, -0.0002281777560710907, -0.0002136826515197754, -0.00019918754696846008, -0.00018469244241714478, -0.00017019733786582947, -0.00015570223331451416, -0.00014120712876319885, -0.00012671202421188354, -0.00011221691966056824, -9.772181510925293e-05, -8.322671055793762e-05, -6.873160600662231e-05, -5.423650145530701e-05, -3.97413969039917e-05, -2.524629235267639e-05, -1.0751187801361084e-05, 3.7439167499542236e-06, 1.823902130126953e-05, 3.273412585258484e-05, 4.7229230403900146e-05, 6.172433495521545e-05, 7.621943950653076e-05, 9.071454405784607e-05, 0.00010520964860916138, 0.00011970475316047668, 0.000134199857711792, 0.0001486949622631073, 0.0001631900668144226, 0.00017768517136573792, 0.00019218027591705322, 0.00020667538046836853, 0.00022117048501968384, 0.00023566558957099915, 0.00025016069412231445, 0.00026465579867362976, 0.00027915090322494507, 0.0002936460077762604, 0.0003081411123275757, 0.000322636216878891, 0.0003371313214302063, 0.0003516264259815216, 0.0003661215305328369, 0.0003806166350841522, 0.00039511173963546753, 0.00040960684418678284, 0.00042410194873809814, 0.00043859705328941345, 0.00045309215784072876, 0.00046758726239204407, 0.0004820823669433594]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 10.0, 12.0, 12.0, 17.0, 41.0, 60.0, 80.0, 117.0, 213.0, 391.0, 714.0, 1371.0, 2637.0, 6372.0, 18061.0, 73521.0, 815400.0, 94653.0, 21334.0, 7300.0, 2936.0, 1455.0, 770.0, 399.0, 235.0, 156.0, 90.0, 67.0, 43.0, 17.0, 20.0, 14.0, 8.0, 4.0, 5.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60546875, -0.5842742919921875, -0.563079833984375, -0.5418853759765625, -0.52069091796875, -0.4994964599609375, -0.478302001953125, -0.4571075439453125, -0.4359130859375, -0.4147186279296875, -0.393524169921875, -0.3723297119140625, -0.35113525390625, -0.3299407958984375, -0.308746337890625, -0.2875518798828125, -0.266357421875, -0.2451629638671875, -0.223968505859375, -0.2027740478515625, -0.18157958984375, -0.1603851318359375, -0.139190673828125, -0.1179962158203125, -0.0968017578125, -0.0756072998046875, -0.054412841796875, -0.0332183837890625, -0.01202392578125, 0.0091705322265625, 0.030364990234375, 0.0515594482421875, 0.07275390625, 0.0939483642578125, 0.115142822265625, 0.1363372802734375, 0.15753173828125, 0.1787261962890625, 0.199920654296875, 0.2211151123046875, 0.2423095703125, 0.2635040283203125, 0.284698486328125, 0.3058929443359375, 0.32708740234375, 0.3482818603515625, 0.369476318359375, 0.3906707763671875, 0.411865234375, 0.4330596923828125, 0.454254150390625, 0.4754486083984375, 0.49664306640625, 0.5178375244140625, 0.539031982421875, 0.5602264404296875, 0.5814208984375, 0.6026153564453125, 0.623809814453125, 0.6450042724609375, 0.66619873046875, 0.6873931884765625, 0.708587646484375, 0.7297821044921875, 0.7509765625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 12.0, 4.0, 2.0, 14.0, 14.0, 14.0, 19.0, 34.0, 42.0, 59.0, 91.0, 139.0, 124.0, 113.0, 84.0, 65.0, 38.0, 36.0, 20.0, 13.0, 12.0, 3.0, 7.0, 7.0, 8.0, 4.0, 7.0, 4.0, 6.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.89599609375, -0.868377685546875, -0.84075927734375, -0.813140869140625, -0.7855224609375, -0.757904052734375, -0.73028564453125, -0.702667236328125, -0.675048828125, -0.647430419921875, -0.61981201171875, -0.592193603515625, -0.5645751953125, -0.536956787109375, -0.50933837890625, -0.481719970703125, -0.4541015625, -0.426483154296875, -0.39886474609375, -0.371246337890625, -0.3436279296875, -0.316009521484375, -0.28839111328125, -0.260772705078125, -0.233154296875, -0.205535888671875, -0.17791748046875, -0.150299072265625, -0.1226806640625, -0.095062255859375, -0.06744384765625, -0.039825439453125, -0.01220703125, 0.015411376953125, 0.04302978515625, 0.070648193359375, 0.0982666015625, 0.125885009765625, 0.15350341796875, 0.181121826171875, 0.208740234375, 0.236358642578125, 0.26397705078125, 0.291595458984375, 0.3192138671875, 0.346832275390625, 0.37445068359375, 0.402069091796875, 0.4296875, 0.457305908203125, 0.48492431640625, 0.512542724609375, 0.5401611328125, 0.567779541015625, 0.59539794921875, 0.623016357421875, 0.650634765625, 0.678253173828125, 0.70587158203125, 0.733489990234375, 0.7611083984375, 0.788726806640625, 0.81634521484375, 0.843963623046875, 0.87158203125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 9.0, 44.0, 141.0, 623.0, 110.0, 42.0, 15.0, 7.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.31908416748047, -54.255455017089844, -52.191829681396484, -50.128204345703125, -48.0645751953125, -46.000946044921875, -43.937320709228516, -41.873695373535156, -39.81006622314453, -37.746437072753906, -35.68281173706055, -33.61918640136719, -31.555557250976562, -29.49193000793457, -27.428302764892578, -25.364675521850586, -23.301048278808594, -21.2374210357666, -19.17379379272461, -17.110166549682617, -15.046539306640625, -12.982912063598633, -10.91928482055664, -8.855657577514648, -6.792030334472656, -4.728403091430664, -2.664775848388672, -0.6011486053466797, 1.4624786376953125, 3.5261058807373047, 5.589733123779297, 7.653360366821289, 9.716987609863281, 11.780614852905273, 13.844242095947266, 15.907869338989258, 17.97149658203125, 20.035123825073242, 22.098751068115234, 24.162378311157227, 26.22600555419922, 28.28963279724121, 30.353260040283203, 32.41688537597656, 34.48051452636719, 36.54414367675781, 38.60776901245117, 40.67139434814453, 42.735023498535156, 44.79865264892578, 46.86227798461914, 48.9259033203125, 50.989532470703125, 53.05316162109375, 55.11678695678711, 57.18041229248047, 59.244041442871094, 61.30767059326172, 63.37129592895508, 65.43492126464844, 67.49855041503906, 69.56217956542969, 71.62580871582031, 73.6894302368164, 75.75305938720703]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 5.0, 5.0, 6.0, 4.0, 4.0, 6.0, 9.0, 17.0, 17.0, 23.0, 18.0, 23.0, 27.0, 25.0, 23.0, 47.0, 306.0, 175.0, 47.0, 39.0, 18.0, 24.0, 26.0, 26.0, 17.0, 20.0, 11.0, 15.0, 7.0, 8.0, 5.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0], "bins": [-28.446056365966797, -27.714139938354492, -26.982223510742188, -26.25030517578125, -25.518388748168945, -24.78647232055664, -24.054555892944336, -23.32263946533203, -22.590721130371094, -21.85880470275879, -21.126888275146484, -20.394969940185547, -19.663053512573242, -18.931137084960938, -18.199220657348633, -17.467304229736328, -16.73538589477539, -16.003469467163086, -15.271552085876465, -14.53963565826416, -13.807718276977539, -13.075801849365234, -12.34388542175293, -11.611968040466309, -10.88005256652832, -10.148136138916016, -9.416218757629395, -8.68430233001709, -7.952384948730469, -7.220468521118164, -6.488551616668701, -5.756634712219238, -5.024717330932617, -4.292800426483154, -3.5608835220336914, -2.8289668560028076, -2.0970499515533447, -1.3651330471038818, -0.633216381072998, 0.09870052337646484, 0.8306174278259277, 1.5625343322753906, 2.2944512367248535, 3.0263679027557373, 3.7582848072052, 4.490201950073242, 5.222118377685547, 5.95403528213501, 6.685952186584473, 7.4178690910339355, 8.149785995483398, 8.881702423095703, 9.613619804382324, 10.345536231994629, 11.07745361328125, 11.809370040893555, 12.54128646850586, 13.273202896118164, 14.005120277404785, 14.73703670501709, 15.468954086303711, 16.200870513916016, 16.93278694152832, 17.664703369140625, 18.396621704101562]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 7.0, 4.0, 6.0, 8.0, 10.0, 10.0, 14.0, 15.0, 19.0, 18.0, 26.0, 27.0, 37.0, 54.0, 116.0, 227.0, 80.0, 48.0, 37.0, 37.0, 31.0, 27.0, 17.0, 27.0, 20.0, 15.0, 20.0, 10.0, 9.0, 7.0, 7.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9755859375, -1.9196624755859375, -1.863739013671875, -1.8078155517578125, -1.75189208984375, -1.6959686279296875, -1.640045166015625, -1.5841217041015625, -1.5281982421875, -1.4722747802734375, -1.416351318359375, -1.3604278564453125, -1.30450439453125, -1.2485809326171875, -1.192657470703125, -1.1367340087890625, -1.080810546875, -1.0248870849609375, -0.968963623046875, -0.9130401611328125, -0.85711669921875, -0.8011932373046875, -0.745269775390625, -0.6893463134765625, -0.6334228515625, -0.5774993896484375, -0.521575927734375, -0.4656524658203125, -0.40972900390625, -0.3538055419921875, -0.297882080078125, -0.2419586181640625, -0.18603515625, -0.1301116943359375, -0.074188232421875, -0.0182647705078125, 0.03765869140625, 0.0935821533203125, 0.149505615234375, 0.2054290771484375, 0.2613525390625, 0.3172760009765625, 0.373199462890625, 0.4291229248046875, 0.48504638671875, 0.5409698486328125, 0.596893310546875, 0.6528167724609375, 0.708740234375, 0.7646636962890625, 0.820587158203125, 0.8765106201171875, 0.93243408203125, 0.9883575439453125, 1.044281005859375, 1.1002044677734375, 1.1561279296875, 1.2120513916015625, 1.267974853515625, 1.3238983154296875, 1.37982177734375, 1.4357452392578125, 1.491668701171875, 1.5475921630859375, 1.603515625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 1.0, 0.0, 4.0, 3.0, 2.0, 9.0, 10.0, 17.0, 20.0, 26.0, 64.0, 116.0, 265.0, 1016.0, 9504.0, 8368594.0, 7514.0, 919.0, 240.0, 119.0, 43.0, 38.0, 16.0, 11.0, 3.0, 11.0, 8.0, 1.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0], "bins": [-32.96440887451172, -31.949037551879883, -30.933664321899414, -29.918292999267578, -28.90291976928711, -27.887548446655273, -26.872177124023438, -25.85680389404297, -24.8414306640625, -23.826059341430664, -22.810686111450195, -21.79531478881836, -20.77994155883789, -19.764570236206055, -18.74919891357422, -17.73382568359375, -16.718454360961914, -15.703082084655762, -14.68770980834961, -13.672338485717773, -12.656965255737305, -11.641593933105469, -10.626221656799316, -9.610849380493164, -8.595477104187012, -7.580104827880859, -6.564732551574707, -5.549360752105713, -4.5339884757995605, -3.518616199493408, -2.503244400024414, -1.4878721237182617, -0.4724998474121094, 0.5428723096847534, 1.5582444667816162, 2.5736165046691895, 3.588988780975342, 4.604361057281494, 5.619732856750488, 6.635105133056641, 7.650477409362793, 8.665849685668945, 9.681221961975098, 10.69659423828125, 11.711965560913086, 12.727338790893555, 13.74271011352539, 14.758082389831543, 15.773454666137695, 16.78882598876953, 17.80419921875, 18.819570541381836, 19.834943771362305, 20.85031509399414, 21.86568832397461, 22.881059646606445, 23.89643096923828, 24.911802291870117, 25.927175521850586, 26.942546844482422, 27.95792007446289, 28.973291397094727, 29.988662719726562, 31.00403594970703, 32.0194091796875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 6.0, 3.0, 3.0, 4.0, 1.0, 8.0, 7.0, 3.0, 8.0, 10.0, 6.0, 1.0, 4.0, 3.0, 3.0, 6.0, 5.0, 2.0, 0.0, 7.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.974762916564941, -8.476577758789062, -7.978392601013184, -7.480207443237305, -6.982022285461426, -6.483837127685547, -5.98565149307251, -5.487466335296631, -4.989281177520752, -4.491096019744873, -3.992910861968994, -3.494725465774536, -2.9965403079986572, -2.4983551502227783, -2.0001697540283203, -1.5019845962524414, -1.0037994384765625, -0.5056142210960388, -0.007429003715515137, 0.4907562732696533, 0.9889414310455322, 1.4871265888214111, 1.9853119850158691, 2.483497142791748, 2.981682300567627, 3.479867458343506, 3.9780526161193848, 4.476238250732422, 4.974423408508301, 5.47260856628418, 5.970793724060059, 6.4689788818359375, 6.9671630859375, 7.465348243713379, 7.963533401489258, 8.461718559265137, 8.959903717041016, 9.458088874816895, 9.956274032592773, 10.454460144042969, 10.952644348144531, 11.45082950592041, 11.949014663696289, 12.447199821472168, 12.945384979248047, 13.443570137023926, 13.941755294799805, 14.43994140625, 14.938126564025879, 15.436311721801758, 15.934496879577637, 16.432682037353516, 16.93086814880371, 17.429052352905273, 17.92723846435547, 18.42542266845703, 18.923608779907227, 19.421794891357422, 19.919979095458984, 20.41816520690918, 20.916349411010742, 21.414535522460938, 21.9127197265625, 22.410905838012695, 22.909090042114258]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 15.0, 18.0, 19.0, 33.0, 50.0, 76.0, 131.0, 217.0, 415.0, 742.0, 1623.0, 4054.0, 12770.0, 50350.0, 214001.0, 182982.0, 40457.0, 10243.0, 3254.0, 1315.0, 631.0, 333.0, 180.0, 121.0, 78.0, 47.0, 30.0, 23.0, 15.0, 8.0, 7.0, 9.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.46875, -17.890380859375, -17.31201171875, -16.733642578125, -16.1552734375, -15.576904296875, -14.99853515625, -14.420166015625, -13.841796875, -13.263427734375, -12.68505859375, -12.106689453125, -11.5283203125, -10.949951171875, -10.37158203125, -9.793212890625, -9.21484375, -8.636474609375, -8.05810546875, -7.479736328125, -6.9013671875, -6.322998046875, -5.74462890625, -5.166259765625, -4.587890625, -4.009521484375, -3.43115234375, -2.852783203125, -2.2744140625, -1.696044921875, -1.11767578125, -0.539306640625, 0.0390625, 0.617431640625, 1.19580078125, 1.774169921875, 2.3525390625, 2.930908203125, 3.50927734375, 4.087646484375, 4.666015625, 5.244384765625, 5.82275390625, 6.401123046875, 6.9794921875, 7.557861328125, 8.13623046875, 8.714599609375, 9.29296875, 9.871337890625, 10.44970703125, 11.028076171875, 11.6064453125, 12.184814453125, 12.76318359375, 13.341552734375, 13.919921875, 14.498291015625, 15.07666015625, 15.655029296875, 16.2333984375, 16.811767578125, 17.39013671875, 17.968505859375, 18.546875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 7.0, 7.0, 9.0, 9.0, 16.0, 18.0, 16.0, 33.0, 35.0, 43.0, 54.0, 68.0, 83.0, 94.0, 100.0, 75.0, 80.0, 59.0, 45.0, 44.0, 31.0, 27.0, 13.0, 15.0, 13.0, 6.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.853515625, -2.772705078125, -2.69189453125, -2.611083984375, -2.5302734375, -2.449462890625, -2.36865234375, -2.287841796875, -2.20703125, -2.126220703125, -2.04541015625, -1.964599609375, -1.8837890625, -1.802978515625, -1.72216796875, -1.641357421875, -1.560546875, -1.479736328125, -1.39892578125, -1.318115234375, -1.2373046875, -1.156494140625, -1.07568359375, -0.994873046875, -0.9140625, -0.833251953125, -0.75244140625, -0.671630859375, -0.5908203125, -0.510009765625, -0.42919921875, -0.348388671875, -0.267578125, -0.186767578125, -0.10595703125, -0.025146484375, 0.0556640625, 0.136474609375, 0.21728515625, 0.298095703125, 0.37890625, 0.459716796875, 0.54052734375, 0.621337890625, 0.7021484375, 0.782958984375, 0.86376953125, 0.944580078125, 1.025390625, 1.106201171875, 1.18701171875, 1.267822265625, 1.3486328125, 1.429443359375, 1.51025390625, 1.591064453125, 1.671875, 1.752685546875, 1.83349609375, 1.914306640625, 1.9951171875, 2.075927734375, 2.15673828125, 2.237548828125, 2.318359375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 4.0, 3.0, 7.0, 4.0, 6.0, 15.0, 16.0, 25.0, 57.0, 76.0, 74.0, 64.0, 51.0, 21.0, 15.0, 15.0, 8.0, 4.0, 4.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.403003692626953, -15.927031517028809, -15.451059341430664, -14.975088119506836, -14.499115943908691, -14.023143768310547, -13.547171592712402, -13.071199417114258, -12.59522819519043, -12.119256019592285, -11.64328384399414, -11.167312622070312, -10.691340446472168, -10.215368270874023, -9.739396095275879, -9.263423919677734, -8.78745174407959, -8.311479568481445, -7.835507869720459, -7.3595356941223145, -6.883563995361328, -6.407591819763184, -5.931619644165039, -5.4556474685668945, -4.979675769805908, -4.503703594207764, -4.027731895446777, -3.551759719848633, -3.0757877826690674, -2.599815845489502, -2.1238436698913574, -1.647871732711792, -1.1718988418579102, -0.6959268450737, -0.21995484828948975, 0.25601720809936523, 0.7319891452789307, 1.207961082458496, 1.6839332580566406, 2.159905195236206, 2.6358771324157715, 3.111849069595337, 3.5878210067749023, 4.063793182373047, 4.539765357971191, 5.015737056732178, 5.491709232330322, 5.967680931091309, 6.443653106689453, 6.919625282287598, 7.395596981048584, 7.8715691566467285, 8.347540855407715, 8.82351303100586, 9.299485206604004, 9.775457382202148, 10.251428604125977, 10.727400779724121, 11.203372955322266, 11.679344177246094, 12.155316352844238, 12.631288528442383, 13.107260704040527, 13.583232879638672, 14.059205055236816]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 5.0, 9.0, 3.0, 13.0, 9.0, 23.0, 35.0, 57.0, 65.0, 54.0, 63.0, 42.0, 37.0, 14.0, 9.0, 3.0, 9.0, 5.0, 2.0, 3.0, 4.0, 1.0, 4.0, 0.0, 1.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.323083877563477, -9.005084037780762, -8.687085151672363, -8.369085311889648, -8.05108642578125, -7.733086585998535, -7.4150872230529785, -7.097087860107422, -6.779088020324707, -6.46108865737915, -6.143089294433594, -5.825089454650879, -5.507090091705322, -5.189090728759766, -4.871091365814209, -4.553092002868652, -4.235092639923096, -3.917093276977539, -3.5990936756134033, -3.2810943126678467, -2.963094711303711, -2.6450953483581543, -2.3270959854125977, -2.009096384048462, -1.6910970211029053, -1.373097538948059, -1.055098056793213, -0.7370986938476562, -0.41909921169281006, -0.10109972953796387, 0.21689963340759277, 0.5348992347717285, 0.8528985977172852, 1.1708980798721313, 1.4888975620269775, 1.8068969249725342, 2.12489652633667, 2.4428958892822266, 2.760895252227783, 3.078894853591919, 3.3968942165374756, 3.7148935794830322, 4.032893180847168, 4.350892543792725, 4.668891906738281, 4.986891746520996, 5.3048906326293945, 5.622890472412109, 5.940889835357666, 6.258889198303223, 6.576888561248779, 6.894887924194336, 7.212887763977051, 7.530887126922607, 7.848886489868164, 8.166886329650879, 8.484885215759277, 8.802885055541992, 9.12088394165039, 9.438883781433105, 9.756882667541504, 10.074882507324219, 10.392881393432617, 10.710881233215332, 11.028881072998047]}, "_wandb": {"runtime": 4137}} \ No newline at end of file