diff --git "a/wandb/run-20220301_141622-dv1pefph/files/wandb-summary.json" "b/wandb/run-20220301_141622-dv1pefph/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220301_141622-dv1pefph/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 5.334, "train/learning_rate": 2.976e-05, "train/epoch": 0.49, "train/global_step": 500, "_runtime": 2307, "_timestamp": 1646146489, "_step": 499, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 9.0, 31.0, 175.0, 527.0, 199.0, 55.0, 15.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-63.70233917236328, -55.255706787109375, -46.809078216552734, -38.362449645996094, -29.915817260742188, -21.46918487548828, -13.02255630493164, -4.575927734375, 3.8707046508789062, 12.31733512878418, 20.763965606689453, 29.210596084594727, 37.6572265625, 46.103858947753906, 54.55048751831055, 62.99711608886719, 71.4437484741211, 79.890380859375, 88.33700561523438, 96.78363800048828, 105.23027038574219, 113.6769027709961, 122.12353515625, 130.57015991210938, 139.01678466796875, 147.46340942382812, 155.91004943847656, 164.35667419433594, 172.80331420898438, 181.24993896484375, 189.69656372070312, 198.1431884765625, 206.58984375, 215.03646850585938, 223.4831085205078, 231.9297332763672, 240.37637329101562, 248.822998046875, 257.2696228027344, 265.71624755859375, 274.16290283203125, 282.6095275878906, 291.05615234375, 299.5028076171875, 307.9494323730469, 316.39605712890625, 324.8426818847656, 333.289306640625, 341.7359313964844, 350.18255615234375, 358.6291809082031, 367.0758361816406, 375.5224609375, 383.9690856933594, 392.41571044921875, 400.8623352050781, 409.3089599609375, 417.7555847167969, 426.20220947265625, 434.64886474609375, 443.0954895019531, 451.5421142578125, 459.9887390136719, 468.43536376953125, 476.88201904296875]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 2.0, 3.0, 4.0, 5.0, 6.0, 12.0, 15.0, 14.0, 17.0, 12.0, 29.0, 19.0, 30.0, 25.0, 36.0, 30.0, 31.0, 38.0, 37.0, 45.0, 48.0, 51.0, 44.0, 33.0, 56.0, 39.0, 34.0, 37.0, 28.0, 43.0, 38.0, 21.0, 11.0, 19.0, 17.0, 20.0, 11.0, 15.0, 7.0, 6.0, 8.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.18853759765625, -85.23828125, -82.28802490234375, -79.3377685546875, -76.38751220703125, -73.437255859375, -70.48699951171875, -67.53673553466797, -64.58647918701172, -61.63622283935547, -58.68596649169922, -55.73571014404297, -52.78544998168945, -49.8351936340332, -46.88493728637695, -43.93467712402344, -40.98442459106445, -38.0341682434082, -35.08391189575195, -32.13365173339844, -29.183395385742188, -26.233139038085938, -23.282882690429688, -20.332624435424805, -17.382368087768555, -14.432110786437988, -11.481853485107422, -8.531597137451172, -5.5813398361206055, -2.631082534790039, 0.31917381286621094, 3.2694320678710938, 6.219688415527344, 9.16994571685791, 12.120203018188477, 15.070459365844727, 18.02071762084961, 20.97097396850586, 23.92123031616211, 26.871488571166992, 29.821744918823242, 32.772003173828125, 35.722259521484375, 38.672515869140625, 41.622772216796875, 44.573028564453125, 47.523284912109375, 50.47354507446289, 53.42380142211914, 56.37405776977539, 59.32431411743164, 62.274574279785156, 65.2248306274414, 68.17508697509766, 71.1253433227539, 74.07559967041016, 77.0258560180664, 79.97611236572266, 82.9263687133789, 85.87662506103516, 88.8268814086914, 91.77714538574219, 94.72740173339844, 97.67765808105469, 100.62791442871094]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 11.0, 10.0, 21.0, 29.0, 59.0, 78.0, 71.0, 94.0, 107.0, 110.0, 101.0, 99.0, 58.0, 52.0, 39.0, 29.0, 17.0, 9.0, 4.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.625, -16.1368408203125, -15.648681640625, -15.1605224609375, -14.67236328125, -14.1842041015625, -13.696044921875, -13.2078857421875, -12.7197265625, -12.2315673828125, -11.743408203125, -11.2552490234375, -10.76708984375, -10.2789306640625, -9.790771484375, -9.3026123046875, -8.814453125, -8.3262939453125, -7.838134765625, -7.3499755859375, -6.86181640625, -6.3736572265625, -5.885498046875, -5.3973388671875, -4.9091796875, -4.4210205078125, -3.932861328125, -3.4447021484375, -2.95654296875, -2.4683837890625, -1.980224609375, -1.4920654296875, -1.00390625, -0.5157470703125, -0.027587890625, 0.4605712890625, 0.94873046875, 1.4368896484375, 1.925048828125, 2.4132080078125, 2.9013671875, 3.3895263671875, 3.877685546875, 4.3658447265625, 4.85400390625, 5.3421630859375, 5.830322265625, 6.3184814453125, 6.806640625, 7.2947998046875, 7.782958984375, 8.2711181640625, 8.75927734375, 9.2474365234375, 9.735595703125, 10.2237548828125, 10.7119140625, 11.2000732421875, 11.688232421875, 12.1763916015625, 12.66455078125, 13.1527099609375, 13.640869140625, 14.1290283203125, 14.6171875]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 0.0, 3.0, 2.0, 3.0, 8.0, 6.0, 7.0, 7.0, 9.0, 9.0, 19.0, 9.0, 17.0, 31.0, 50.0, 59.0, 108.0, 137.0, 289.0, 572.0, 1225.0, 3034.0, 11376.0, 79428.0, 3818046.0, 254957.0, 17307.0, 4736.0, 1511.0, 651.0, 301.0, 158.0, 76.0, 42.0, 29.0, 18.0, 14.0, 12.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-47.65625, -46.31884765625, -44.9814453125, -43.64404296875, -42.306640625, -40.96923828125, -39.6318359375, -38.29443359375, -36.95703125, -35.61962890625, -34.2822265625, -32.94482421875, -31.607421875, -30.27001953125, -28.9326171875, -27.59521484375, -26.2578125, -24.92041015625, -23.5830078125, -22.24560546875, -20.908203125, -19.57080078125, -18.2333984375, -16.89599609375, -15.55859375, -14.22119140625, -12.8837890625, -11.54638671875, -10.208984375, -8.87158203125, -7.5341796875, -6.19677734375, -4.859375, -3.52197265625, -2.1845703125, -0.84716796875, 0.490234375, 1.82763671875, 3.1650390625, 4.50244140625, 5.83984375, 7.17724609375, 8.5146484375, 9.85205078125, 11.189453125, 12.52685546875, 13.8642578125, 15.20166015625, 16.5390625, 17.87646484375, 19.2138671875, 20.55126953125, 21.888671875, 23.22607421875, 24.5634765625, 25.90087890625, 27.23828125, 28.57568359375, 29.9130859375, 31.25048828125, 32.587890625, 33.92529296875, 35.2626953125, 36.60009765625, 37.9375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 6.0, 11.0, 10.0, 15.0, 25.0, 31.0, 23.0, 53.0, 104.0, 208.0, 518.0, 1316.0, 1032.0, 387.0, 146.0, 76.0, 48.0, 20.0, 21.0, 9.0, 8.0, 6.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-69.0625, -67.486083984375, -65.90966796875, -64.333251953125, -62.7568359375, -61.180419921875, -59.60400390625, -58.027587890625, -56.451171875, -54.874755859375, -53.29833984375, -51.721923828125, -50.1455078125, -48.569091796875, -46.99267578125, -45.416259765625, -43.83984375, -42.263427734375, -40.68701171875, -39.110595703125, -37.5341796875, -35.957763671875, -34.38134765625, -32.804931640625, -31.228515625, -29.652099609375, -28.07568359375, -26.499267578125, -24.9228515625, -23.346435546875, -21.77001953125, -20.193603515625, -18.6171875, -17.040771484375, -15.46435546875, -13.887939453125, -12.3115234375, -10.735107421875, -9.15869140625, -7.582275390625, -6.005859375, -4.429443359375, -2.85302734375, -1.276611328125, 0.2998046875, 1.876220703125, 3.45263671875, 5.029052734375, 6.60546875, 8.181884765625, 9.75830078125, 11.334716796875, 12.9111328125, 14.487548828125, 16.06396484375, 17.640380859375, 19.216796875, 20.793212890625, 22.36962890625, 23.946044921875, 25.5224609375, 27.098876953125, 28.67529296875, 30.251708984375, 31.828125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 8.0, 16.0, 28.0, 35.0, 58.0, 84.0, 122.0, 266.0, 732.0, 6688.0, 3940210.0, 242084.0, 2987.0, 473.0, 232.0, 114.0, 68.0, 32.0, 26.0, 9.0, 6.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-229.75, -223.517578125, -217.28515625, -211.052734375, -204.8203125, -198.587890625, -192.35546875, -186.123046875, -179.890625, -173.658203125, -167.42578125, -161.193359375, -154.9609375, -148.728515625, -142.49609375, -136.263671875, -130.03125, -123.798828125, -117.56640625, -111.333984375, -105.1015625, -98.869140625, -92.63671875, -86.404296875, -80.171875, -73.939453125, -67.70703125, -61.474609375, -55.2421875, -49.009765625, -42.77734375, -36.544921875, -30.3125, -24.080078125, -17.84765625, -11.615234375, -5.3828125, 0.849609375, 7.08203125, 13.314453125, 19.546875, 25.779296875, 32.01171875, 38.244140625, 44.4765625, 50.708984375, 56.94140625, 63.173828125, 69.40625, 75.638671875, 81.87109375, 88.103515625, 94.3359375, 100.568359375, 106.80078125, 113.033203125, 119.265625, 125.498046875, 131.73046875, 137.962890625, 144.1953125, 150.427734375, 156.66015625, 162.892578125, 169.125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 5.0, 8.0, 40.0, 78.0, 325.0, 444.0, 93.0, 14.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-216.6140899658203, -207.62353515625, -198.63299560546875, -189.64244079589844, -180.65188598632812, -171.66134643554688, -162.67079162597656, -153.68023681640625, -144.689697265625, -135.6991424560547, -126.7085952758789, -117.71804809570312, -108.72749328613281, -99.73694610595703, -90.74639892578125, -81.75584411621094, -72.76528930664062, -63.77473831176758, -54.78418731689453, -45.79364013671875, -36.8030891418457, -27.812538146972656, -18.821990966796875, -9.831439971923828, -0.8408889770507812, 8.14966106414795, 17.14021110534668, 26.130760192871094, 35.12131118774414, 44.11186218261719, 53.10240936279297, 62.092960357666016, 71.08349609375, 80.07404327392578, 89.0645980834961, 98.05514526367188, 107.04570007324219, 116.03624725341797, 125.02679443359375, 134.01734924316406, 143.00790405273438, 151.9984588623047, 160.98899841308594, 169.97955322265625, 178.97010803222656, 187.96066284179688, 196.95120239257812, 205.94175720214844, 214.9322967529297, 223.9228515625, 232.91339111328125, 241.90394592285156, 250.89450073242188, 259.8850402832031, 268.8756103515625, 277.86614990234375, 286.856689453125, 295.84722900390625, 304.8377990722656, 313.8283386230469, 322.8188781738281, 331.8094482421875, 340.79998779296875, 349.79052734375, 358.7810974121094]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 6.0, 6.0, 11.0, 15.0, 15.0, 16.0, 24.0, 36.0, 30.0, 35.0, 44.0, 45.0, 43.0, 41.0, 43.0, 46.0, 53.0, 49.0, 46.0, 50.0, 60.0, 38.0, 40.0, 41.0, 36.0, 27.0, 19.0, 22.0, 14.0, 18.0, 10.0, 7.0, 6.0, 4.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-97.15975952148438, -93.80370330810547, -90.4476547241211, -87.09159851074219, -83.73554992675781, -80.3794937133789, -77.0234375, -73.66738891601562, -70.31134033203125, -66.95528411865234, -63.59923553466797, -60.24317932128906, -56.88713073730469, -53.53107452392578, -50.17502212524414, -46.8189697265625, -43.462913513183594, -40.10686111450195, -36.75080871582031, -33.394752502441406, -30.0387020111084, -26.682649612426758, -23.326595306396484, -19.970542907714844, -16.614490509033203, -13.258438110351562, -9.902384757995605, -6.546331405639648, -3.190279006958008, 0.1657733917236328, 3.5218276977539062, 6.877880096435547, 10.233924865722656, 13.589977264404297, 16.946029663085938, 20.30208396911621, 23.65813636779785, 27.014188766479492, 30.370243072509766, 33.726295471191406, 37.08234786987305, 40.43840026855469, 43.79445266723633, 47.15050506591797, 50.506561279296875, 53.86260986328125, 57.218666076660156, 60.5747184753418, 63.93077087402344, 67.28682708740234, 70.64287567138672, 73.99893188476562, 77.35498046875, 80.7110366821289, 84.06709289550781, 87.42314147949219, 90.77919006347656, 94.13524627685547, 97.49129486083984, 100.84735107421875, 104.20339965820312, 107.55945587158203, 110.91551208496094, 114.27156066894531, 117.62761688232422]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 10.0, 16.0, 21.0, 40.0, 42.0, 49.0, 63.0, 75.0, 71.0, 100.0, 96.0, 97.0, 73.0, 62.0, 58.0, 40.0, 37.0, 18.0, 10.0, 8.0, 3.0, 8.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5703125, -15.1124267578125, -14.654541015625, -14.1966552734375, -13.73876953125, -13.2808837890625, -12.822998046875, -12.3651123046875, -11.9072265625, -11.4493408203125, -10.991455078125, -10.5335693359375, -10.07568359375, -9.6177978515625, -9.159912109375, -8.7020263671875, -8.244140625, -7.7862548828125, -7.328369140625, -6.8704833984375, -6.41259765625, -5.9547119140625, -5.496826171875, -5.0389404296875, -4.5810546875, -4.1231689453125, -3.665283203125, -3.2073974609375, -2.74951171875, -2.2916259765625, -1.833740234375, -1.3758544921875, -0.91796875, -0.4600830078125, -0.002197265625, 0.4556884765625, 0.91357421875, 1.3714599609375, 1.829345703125, 2.2872314453125, 2.7451171875, 3.2030029296875, 3.660888671875, 4.1187744140625, 4.57666015625, 5.0345458984375, 5.492431640625, 5.9503173828125, 6.408203125, 6.8660888671875, 7.323974609375, 7.7818603515625, 8.23974609375, 8.6976318359375, 9.155517578125, 9.6134033203125, 10.0712890625, 10.5291748046875, 10.987060546875, 11.4449462890625, 11.90283203125, 12.3607177734375, 12.818603515625, 13.2764892578125, 13.734375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 3.0, 4.0, 3.0, 6.0, 12.0, 15.0, 23.0, 21.0, 21.0, 33.0, 29.0, 65.0, 75.0, 142.0, 221.0, 394.0, 712.0, 1555.0, 3218.0, 7541.0, 18748.0, 52186.0, 168809.0, 483886.0, 210019.0, 62478.0, 22296.0, 8528.0, 3772.0, 1726.0, 844.0, 419.0, 235.0, 152.0, 86.0, 80.0, 46.0, 33.0, 26.0, 16.0, 19.0, 11.0, 10.0, 4.0, 8.0, 6.0, 7.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.4462890625, -1.4004974365234375, -1.354705810546875, -1.3089141845703125, -1.26312255859375, -1.2173309326171875, -1.171539306640625, -1.1257476806640625, -1.0799560546875, -1.0341644287109375, -0.988372802734375, -0.9425811767578125, -0.89678955078125, -0.8509979248046875, -0.805206298828125, -0.7594146728515625, -0.713623046875, -0.6678314208984375, -0.622039794921875, -0.5762481689453125, -0.53045654296875, -0.4846649169921875, -0.438873291015625, -0.3930816650390625, -0.3472900390625, -0.3014984130859375, -0.255706787109375, -0.2099151611328125, -0.16412353515625, -0.1183319091796875, -0.072540283203125, -0.0267486572265625, 0.01904296875, 0.0648345947265625, 0.110626220703125, 0.1564178466796875, 0.20220947265625, 0.2480010986328125, 0.293792724609375, 0.3395843505859375, 0.3853759765625, 0.4311676025390625, 0.476959228515625, 0.5227508544921875, 0.56854248046875, 0.6143341064453125, 0.660125732421875, 0.7059173583984375, 0.751708984375, 0.7975006103515625, 0.843292236328125, 0.8890838623046875, 0.93487548828125, 0.9806671142578125, 1.026458740234375, 1.0722503662109375, 1.1180419921875, 1.1638336181640625, 1.209625244140625, 1.2554168701171875, 1.30120849609375, 1.3470001220703125, 1.392791748046875, 1.4385833740234375, 1.484375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 5.0, 7.0, 12.0, 10.0, 10.0, 17.0, 13.0, 22.0, 14.0, 30.0, 24.0, 17.0, 36.0, 37.0, 37.0, 39.0, 38.0, 35.0, 34.0, 47.0, 1064.0, 35.0, 48.0, 41.0, 32.0, 43.0, 41.0, 28.0, 15.0, 27.0, 20.0, 24.0, 21.0, 8.0, 21.0, 13.0, 17.0, 10.0, 8.0, 4.0, 6.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.7734375, -4.625244140625, -4.47705078125, -4.328857421875, -4.1806640625, -4.032470703125, -3.88427734375, -3.736083984375, -3.587890625, -3.439697265625, -3.29150390625, -3.143310546875, -2.9951171875, -2.846923828125, -2.69873046875, -2.550537109375, -2.40234375, -2.254150390625, -2.10595703125, -1.957763671875, -1.8095703125, -1.661376953125, -1.51318359375, -1.364990234375, -1.216796875, -1.068603515625, -0.92041015625, -0.772216796875, -0.6240234375, -0.475830078125, -0.32763671875, -0.179443359375, -0.03125, 0.116943359375, 0.26513671875, 0.413330078125, 0.5615234375, 0.709716796875, 0.85791015625, 1.006103515625, 1.154296875, 1.302490234375, 1.45068359375, 1.598876953125, 1.7470703125, 1.895263671875, 2.04345703125, 2.191650390625, 2.33984375, 2.488037109375, 2.63623046875, 2.784423828125, 2.9326171875, 3.080810546875, 3.22900390625, 3.377197265625, 3.525390625, 3.673583984375, 3.82177734375, 3.969970703125, 4.1181640625, 4.266357421875, 4.41455078125, 4.562744140625, 4.7109375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 5.0, 10.0, 16.0, 28.0, 34.0, 59.0, 62.0, 110.0, 181.0, 253.0, 407.0, 666.0, 1065.0, 1744.0, 2931.0, 4707.0, 7973.0, 13549.0, 23632.0, 42149.0, 78853.0, 159300.0, 1344241.0, 200474.0, 95962.0, 50841.0, 28097.0, 15965.0, 9359.0, 5614.0, 3454.0, 2041.0, 1275.0, 744.0, 480.0, 279.0, 185.0, 135.0, 82.0, 54.0, 32.0, 28.0, 15.0, 13.0, 10.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-0.87451171875, -0.849273681640625, -0.82403564453125, -0.798797607421875, -0.7735595703125, -0.748321533203125, -0.72308349609375, -0.697845458984375, -0.672607421875, -0.647369384765625, -0.62213134765625, -0.596893310546875, -0.5716552734375, -0.546417236328125, -0.52117919921875, -0.495941162109375, -0.470703125, -0.445465087890625, -0.42022705078125, -0.394989013671875, -0.3697509765625, -0.344512939453125, -0.31927490234375, -0.294036865234375, -0.268798828125, -0.243560791015625, -0.21832275390625, -0.193084716796875, -0.1678466796875, -0.142608642578125, -0.11737060546875, -0.092132568359375, -0.06689453125, -0.041656494140625, -0.01641845703125, 0.008819580078125, 0.0340576171875, 0.059295654296875, 0.08453369140625, 0.109771728515625, 0.135009765625, 0.160247802734375, 0.18548583984375, 0.210723876953125, 0.2359619140625, 0.261199951171875, 0.28643798828125, 0.311676025390625, 0.3369140625, 0.362152099609375, 0.38739013671875, 0.412628173828125, 0.4378662109375, 0.463104248046875, 0.48834228515625, 0.513580322265625, 0.538818359375, 0.564056396484375, 0.58929443359375, 0.614532470703125, 0.6397705078125, 0.665008544921875, 0.69024658203125, 0.715484619140625, 0.74072265625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 6.0, 10.0, 11.0, 8.0, 10.0, 11.0, 18.0, 37.0, 24.0, 36.0, 47.0, 53.0, 66.0, 68.0, 90.0, 78.0, 67.0, 71.0, 58.0, 34.0, 38.0, 24.0, 36.0, 17.0, 18.0, 11.0, 11.0, 6.0, 4.0, 5.0, 1.0, 5.0, 3.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.002780914306640625, -0.0027021169662475586, -0.002623319625854492, -0.0025445222854614258, -0.0024657249450683594, -0.002386927604675293, -0.0023081302642822266, -0.00222933292388916, -0.0021505355834960938, -0.0020717382431030273, -0.001992940902709961, -0.0019141435623168945, -0.0018353462219238281, -0.0017565488815307617, -0.0016777515411376953, -0.001598954200744629, -0.0015201568603515625, -0.001441359519958496, -0.0013625621795654297, -0.0012837648391723633, -0.0012049674987792969, -0.0011261701583862305, -0.001047372817993164, -0.0009685754776000977, -0.0008897781372070312, -0.0008109807968139648, -0.0007321834564208984, -0.000653386116027832, -0.0005745887756347656, -0.0004957914352416992, -0.0004169940948486328, -0.0003381967544555664, -0.0002593994140625, -0.0001806020736694336, -0.00010180473327636719, -2.300739288330078e-05, 5.5789947509765625e-05, 0.00013458728790283203, 0.00021338462829589844, 0.00029218196868896484, 0.00037097930908203125, 0.00044977664947509766, 0.0005285739898681641, 0.0006073713302612305, 0.0006861686706542969, 0.0007649660110473633, 0.0008437633514404297, 0.0009225606918334961, 0.0010013580322265625, 0.001080155372619629, 0.0011589527130126953, 0.0012377500534057617, 0.0013165473937988281, 0.0013953447341918945, 0.001474142074584961, 0.0015529394149780273, 0.0016317367553710938, 0.0017105340957641602, 0.0017893314361572266, 0.001868128776550293, 0.0019469261169433594, 0.0020257234573364258, 0.002104520797729492, 0.0021833181381225586, 0.002262115478515625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 3.0, 5.0, 13.0, 15.0, 21.0, 17.0, 27.0, 30.0, 40.0, 50.0, 67.0, 86.0, 121.0, 150.0, 225.0, 312.0, 745.0, 92764.0, 951631.0, 975.0, 366.0, 210.0, 157.0, 124.0, 90.0, 59.0, 62.0, 38.0, 24.0, 29.0, 12.0, 13.0, 13.0, 13.0, 7.0, 5.0, 6.0, 10.0, 5.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.05206298828125, -0.0505366325378418, -0.049010276794433594, -0.04748392105102539, -0.04595756530761719, -0.044431209564208984, -0.04290485382080078, -0.04137849807739258, -0.039852142333984375, -0.03832578659057617, -0.03679943084716797, -0.035273075103759766, -0.03374671936035156, -0.03222036361694336, -0.030694007873535156, -0.029167652130126953, -0.02764129638671875, -0.026114940643310547, -0.024588584899902344, -0.02306222915649414, -0.021535873413085938, -0.020009517669677734, -0.01848316192626953, -0.016956806182861328, -0.015430450439453125, -0.013904094696044922, -0.012377738952636719, -0.010851383209228516, -0.009325027465820312, -0.007798671722412109, -0.006272315979003906, -0.004745960235595703, -0.0032196044921875, -0.0016932487487792969, -0.00016689300537109375, 0.0013594627380371094, 0.0028858184814453125, 0.004412174224853516, 0.005938529968261719, 0.007464885711669922, 0.008991241455078125, 0.010517597198486328, 0.012043952941894531, 0.013570308685302734, 0.015096664428710938, 0.01662302017211914, 0.018149375915527344, 0.019675731658935547, 0.02120208740234375, 0.022728443145751953, 0.024254798889160156, 0.02578115463256836, 0.027307510375976562, 0.028833866119384766, 0.03036022186279297, 0.03188657760620117, 0.033412933349609375, 0.03493928909301758, 0.03646564483642578, 0.037992000579833984, 0.03951835632324219, 0.04104471206665039, 0.042571067810058594, 0.0440974235534668, 0.045623779296875]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 8.0, 24.0, 49.0, 152.0, 284.0, 270.0, 141.0, 52.0, 18.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.001782262697815895, -0.0017206696793437004, -0.0016590766608715057, -0.001597483758814633, -0.0015358907403424382, -0.0014742977218702435, -0.0014127048198133707, -0.001351111801341176, -0.0012895187828689814, -0.0012279257643967867, -0.001166332745924592, -0.0011047398438677192, -0.0010431468253955245, -0.0009815538069233298, -0.0009199608466587961, -0.0008583678863942623, -0.0007967748679220676, -0.000735181849449873, -0.0006735888891853392, -0.0006119959289208055, -0.0005504029104486108, -0.0004888098919764161, -0.00042721693171188235, -0.00036562394234351814, -0.0003040309529751539, -0.0002424379636067897, -0.0001808449742384255, -0.00011925198487006128, -5.7658995501697063e-05, 3.9339938666671515e-06, 6.552698323503137e-05, 0.00012711997260339558, 0.00018871319480240345, 0.00025030618417076766, 0.0003118991735391319, 0.0003734921629074961, 0.0004350851522758603, 0.000496678170748055, 0.0005582711310125887, 0.0006198640912771225, 0.0006814571097493172, 0.0007430501282215118, 0.0008046430884860456, 0.0008662360487505794, 0.000927829067222774, 0.0009894220856949687, 0.0010510149877518415, 0.0011126080062240362, 0.0011742010246962309, 0.0012357940431684256, 0.0012973870616406202, 0.001358979963697493, 0.0014205729821696877, 0.0014821660006418824, 0.0015437589026987553, 0.00160535192117095, 0.0016669449396431446, 0.0017285379581153393, 0.001790130976587534, 0.0018517238786444068, 0.0019133168971166015, 0.0019749097991734743, 0.002036502817645669, 0.0020980958361178637, 0.0021596888545900583]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 10.0, 7.0, 5.0, 4.0, 7.0, 13.0, 15.0, 18.0, 24.0, 27.0, 20.0, 15.0, 22.0, 26.0, 31.0, 44.0, 32.0, 36.0, 44.0, 38.0, 41.0, 32.0, 43.0, 41.0, 35.0, 23.0, 23.0, 37.0, 38.0, 27.0, 28.0, 30.0, 27.0, 21.0, 16.0, 10.0, 18.0, 11.0, 18.0, 9.0, 9.0, 5.0, 5.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.001181483268737793, -0.0011469339951872826, -0.0011123847216367722, -0.0010778354480862617, -0.0010432861745357513, -0.001008736900985241, -0.0009741876274347305, -0.0009396383538842201, -0.0009050890803337097, -0.0008705398067831993, -0.0008359905332326889, -0.0008014412596821785, -0.0007668919861316681, -0.0007323427125811577, -0.0006977934390306473, -0.0006632441654801369, -0.0006286948919296265, -0.0005941456183791161, -0.0005595963448286057, -0.0005250470712780952, -0.0004904977977275848, -0.00045594852417707443, -0.000421399250626564, -0.0003868499770760536, -0.0003523007035255432, -0.0003177514299750328, -0.0002832021564245224, -0.000248652882874012, -0.0002141036093235016, -0.00017955433577299118, -0.00014500506222248077, -0.00011045578867197037, -7.590651512145996e-05, -4.1357241570949554e-05, -6.807968020439148e-06, 2.774130553007126e-05, 6.229057908058167e-05, 9.683985263109207e-05, 0.00013138912618160248, 0.00016593839973211288, 0.0002004876732826233, 0.0002350369468331337, 0.0002695862203836441, 0.0003041354939341545, 0.0003386847674846649, 0.0003732340410351753, 0.00040778331458568573, 0.00044233258813619614, 0.00047688186168670654, 0.000511431135237217, 0.0005459804087877274, 0.0005805296823382378, 0.0006150789558887482, 0.0006496282294392586, 0.000684177502989769, 0.0007187267765402794, 0.0007532760500907898, 0.0007878253236413002, 0.0008223745971918106, 0.000856923870742321, 0.0008914731442928314, 0.0009260224178433418, 0.0009605716913938522, 0.0009951209649443626, 0.001029670238494873]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 10.0, 16.0, 21.0, 40.0, 42.0, 49.0, 63.0, 75.0, 71.0, 100.0, 96.0, 97.0, 73.0, 62.0, 58.0, 40.0, 37.0, 18.0, 10.0, 8.0, 3.0, 8.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.5703125, -15.1124267578125, -14.654541015625, -14.1966552734375, -13.73876953125, -13.2808837890625, -12.822998046875, -12.3651123046875, -11.9072265625, -11.4493408203125, -10.991455078125, -10.5335693359375, -10.07568359375, -9.6177978515625, -9.159912109375, -8.7020263671875, -8.244140625, -7.7862548828125, -7.328369140625, -6.8704833984375, -6.41259765625, -5.9547119140625, -5.496826171875, -5.0389404296875, -4.5810546875, -4.1231689453125, -3.665283203125, -3.2073974609375, -2.74951171875, -2.2916259765625, -1.833740234375, -1.3758544921875, -0.91796875, -0.4600830078125, -0.002197265625, 0.4556884765625, 0.91357421875, 1.3714599609375, 1.829345703125, 2.2872314453125, 2.7451171875, 3.2030029296875, 3.660888671875, 4.1187744140625, 4.57666015625, 5.0345458984375, 5.492431640625, 5.9503173828125, 6.408203125, 6.8660888671875, 7.323974609375, 7.7818603515625, 8.23974609375, 8.6976318359375, 9.155517578125, 9.6134033203125, 10.0712890625, 10.5291748046875, 10.987060546875, 11.4449462890625, 11.90283203125, 12.3607177734375, 12.818603515625, 13.2764892578125, 13.734375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 4.0, 9.0, 8.0, 16.0, 14.0, 27.0, 35.0, 76.0, 100.0, 185.0, 343.0, 643.0, 1329.0, 2659.0, 5741.0, 13768.0, 41457.0, 599941.0, 326554.0, 33786.0, 11825.0, 5178.0, 2321.0, 1121.0, 635.0, 331.0, 173.0, 91.0, 64.0, 32.0, 24.0, 16.0, 12.0, 12.0, 9.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-32.71875, -31.69384765625, -30.6689453125, -29.64404296875, -28.619140625, -27.59423828125, -26.5693359375, -25.54443359375, -24.51953125, -23.49462890625, -22.4697265625, -21.44482421875, -20.419921875, -19.39501953125, -18.3701171875, -17.34521484375, -16.3203125, -15.29541015625, -14.2705078125, -13.24560546875, -12.220703125, -11.19580078125, -10.1708984375, -9.14599609375, -8.12109375, -7.09619140625, -6.0712890625, -5.04638671875, -4.021484375, -2.99658203125, -1.9716796875, -0.94677734375, 0.078125, 1.10302734375, 2.1279296875, 3.15283203125, 4.177734375, 5.20263671875, 6.2275390625, 7.25244140625, 8.27734375, 9.30224609375, 10.3271484375, 11.35205078125, 12.376953125, 13.40185546875, 14.4267578125, 15.45166015625, 16.4765625, 17.50146484375, 18.5263671875, 19.55126953125, 20.576171875, 21.60107421875, 22.6259765625, 23.65087890625, 24.67578125, 25.70068359375, 26.7255859375, 27.75048828125, 28.775390625, 29.80029296875, 30.8251953125, 31.85009765625, 32.875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 11.0, 12.0, 11.0, 12.0, 15.0, 25.0, 18.0, 19.0, 23.0, 49.0, 36.0, 39.0, 54.0, 51.0, 81.0, 121.0, 1587.0, 286.0, 113.0, 59.0, 58.0, 50.0, 41.0, 34.0, 36.0, 28.0, 30.0, 23.0, 17.0, 16.0, 16.0, 12.0, 10.0, 11.0, 5.0, 4.0, 8.0, 3.0, 4.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.5, -21.71875, -20.9375, -20.15625, -19.375, -18.59375, -17.8125, -17.03125, -16.25, -15.46875, -14.6875, -13.90625, -13.125, -12.34375, -11.5625, -10.78125, -10.0, -9.21875, -8.4375, -7.65625, -6.875, -6.09375, -5.3125, -4.53125, -3.75, -2.96875, -2.1875, -1.40625, -0.625, 0.15625, 0.9375, 1.71875, 2.5, 3.28125, 4.0625, 4.84375, 5.625, 6.40625, 7.1875, 7.96875, 8.75, 9.53125, 10.3125, 11.09375, 11.875, 12.65625, 13.4375, 14.21875, 15.0, 15.78125, 16.5625, 17.34375, 18.125, 18.90625, 19.6875, 20.46875, 21.25, 22.03125, 22.8125, 23.59375, 24.375, 25.15625, 25.9375, 26.71875, 27.5]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 2.0, 5.0, 9.0, 11.0, 9.0, 12.0, 11.0, 20.0, 21.0, 23.0, 22.0, 34.0, 38.0, 50.0, 73.0, 119.0, 253.0, 841.0, 28055.0, 3109451.0, 5556.0, 496.0, 199.0, 93.0, 50.0, 52.0, 48.0, 24.0, 16.0, 17.0, 22.0, 14.0, 11.0, 9.0, 10.0, 9.0, 1.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-128.625, -124.986328125, -121.34765625, -117.708984375, -114.0703125, -110.431640625, -106.79296875, -103.154296875, -99.515625, -95.876953125, -92.23828125, -88.599609375, -84.9609375, -81.322265625, -77.68359375, -74.044921875, -70.40625, -66.767578125, -63.12890625, -59.490234375, -55.8515625, -52.212890625, -48.57421875, -44.935546875, -41.296875, -37.658203125, -34.01953125, -30.380859375, -26.7421875, -23.103515625, -19.46484375, -15.826171875, -12.1875, -8.548828125, -4.91015625, -1.271484375, 2.3671875, 6.005859375, 9.64453125, 13.283203125, 16.921875, 20.560546875, 24.19921875, 27.837890625, 31.4765625, 35.115234375, 38.75390625, 42.392578125, 46.03125, 49.669921875, 53.30859375, 56.947265625, 60.5859375, 64.224609375, 67.86328125, 71.501953125, 75.140625, 78.779296875, 82.41796875, 86.056640625, 89.6953125, 93.333984375, 96.97265625, 100.611328125, 104.25]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 967.0, 43.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.22358703613281, -89.59550476074219, -75.96742248535156, -62.33934783935547, -48.711265563964844, -35.08318328857422, -21.455108642578125, -7.8270263671875, 5.801055908203125, 19.429136276245117, 33.05721664428711, 46.68529510498047, 60.313377380371094, 73.94145965576172, 87.56953430175781, 101.19761657714844, 114.82569885253906, 128.4537811279297, 142.0818634033203, 155.70993041992188, 169.3380126953125, 182.96609497070312, 196.59417724609375, 210.22225952148438, 223.850341796875, 237.47842407226562, 251.10650634765625, 264.7345886230469, 278.3626708984375, 291.9907531738281, 305.61883544921875, 319.24688720703125, 332.875, 346.5030822753906, 360.13116455078125, 373.7592468261719, 387.3873291015625, 401.0154113769531, 414.64349365234375, 428.27154541015625, 441.899658203125, 455.5277404785156, 469.15582275390625, 482.7839050292969, 496.4119873046875, 510.0400695800781, 523.6681518554688, 537.2962036132812, 550.92431640625, 564.5523681640625, 578.1804809570312, 591.8085327148438, 605.4366455078125, 619.064697265625, 632.6928100585938, 646.3208618164062, 659.9489135742188, 673.5769653320312, 687.205078125, 700.8331298828125, 714.4612426757812, 728.0892944335938, 741.7174072265625, 755.345458984375, 768.9735717773438]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [5.0, 6.0, 1.0, 5.0, 2.0, 5.0, 2.0, 7.0, 8.0, 10.0, 8.0, 11.0, 17.0, 13.0, 15.0, 18.0, 15.0, 23.0, 20.0, 19.0, 28.0, 28.0, 28.0, 23.0, 37.0, 32.0, 29.0, 35.0, 37.0, 38.0, 31.0, 35.0, 41.0, 23.0, 37.0, 42.0, 31.0, 29.0, 26.0, 26.0, 25.0, 18.0, 24.0, 15.0, 15.0, 9.0, 4.0, 8.0, 10.0, 6.0, 9.0, 3.0, 11.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-52.39962387084961, -50.4113655090332, -48.4231071472168, -46.434844970703125, -44.44658660888672, -42.45832824707031, -40.470069885253906, -38.4818115234375, -36.493553161621094, -34.50529479980469, -32.51703643798828, -30.528776168823242, -28.540515899658203, -26.552257537841797, -24.56399917602539, -22.575740814208984, -20.587478637695312, -18.599220275878906, -16.610960006713867, -14.622701644897461, -12.634442329406738, -10.646183013916016, -8.65792465209961, -6.669665336608887, -4.681406021118164, -2.6931469440460205, -0.704887866973877, 1.2833709716796875, 3.27163028717041, 5.259889602661133, 7.248147964477539, 9.236407279968262, 11.224662780761719, 13.212922096252441, 15.201181411743164, 17.18943977355957, 19.17770004272461, 21.165958404541016, 23.154216766357422, 25.142475128173828, 27.130735397338867, 29.118993759155273, 31.107254028320312, 33.09551239013672, 35.083770751953125, 37.07202911376953, 39.06028747558594, 41.04854965209961, 43.036808013916016, 45.02506637573242, 47.01332473754883, 49.0015869140625, 50.989845275878906, 52.97810363769531, 54.96636199951172, 56.954620361328125, 58.94287872314453, 60.93113708496094, 62.919395446777344, 64.90765380859375, 66.89591217041016, 68.88417053222656, 70.8724365234375, 72.8606948852539, 74.84895324707031]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 4.0, 6.0, 13.0, 20.0, 20.0, 33.0, 43.0, 40.0, 62.0, 54.0, 74.0, 81.0, 92.0, 99.0, 65.0, 59.0, 69.0, 50.0, 36.0, 28.0, 23.0, 11.0, 9.0, 4.0, 6.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5546875, -14.106201171875, -13.65771484375, -13.209228515625, -12.7607421875, -12.312255859375, -11.86376953125, -11.415283203125, -10.966796875, -10.518310546875, -10.06982421875, -9.621337890625, -9.1728515625, -8.724365234375, -8.27587890625, -7.827392578125, -7.37890625, -6.930419921875, -6.48193359375, -6.033447265625, -5.5849609375, -5.136474609375, -4.68798828125, -4.239501953125, -3.791015625, -3.342529296875, -2.89404296875, -2.445556640625, -1.9970703125, -1.548583984375, -1.10009765625, -0.651611328125, -0.203125, 0.245361328125, 0.69384765625, 1.142333984375, 1.5908203125, 2.039306640625, 2.48779296875, 2.936279296875, 3.384765625, 3.833251953125, 4.28173828125, 4.730224609375, 5.1787109375, 5.627197265625, 6.07568359375, 6.524169921875, 6.97265625, 7.421142578125, 7.86962890625, 8.318115234375, 8.7666015625, 9.215087890625, 9.66357421875, 10.112060546875, 10.560546875, 11.009033203125, 11.45751953125, 11.906005859375, 12.3544921875, 12.802978515625, 13.25146484375, 13.699951171875, 14.1484375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 7.0, 6.0, 6.0, 19.0, 17.0, 40.0, 54.0, 98.0, 167.0, 323.0, 704.0, 2149.0, 12165.0, 2652123.0, 1512107.0, 11095.0, 1897.0, 648.0, 289.0, 154.0, 91.0, 41.0, 32.0, 17.0, 13.0, 7.0, 9.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.3125, -76.90625, -74.5, -72.09375, -69.6875, -67.28125, -64.875, -62.46875, -60.0625, -57.65625, -55.25, -52.84375, -50.4375, -48.03125, -45.625, -43.21875, -40.8125, -38.40625, -36.0, -33.59375, -31.1875, -28.78125, -26.375, -23.96875, -21.5625, -19.15625, -16.75, -14.34375, -11.9375, -9.53125, -7.125, -4.71875, -2.3125, 0.09375, 2.5, 4.90625, 7.3125, 9.71875, 12.125, 14.53125, 16.9375, 19.34375, 21.75, 24.15625, 26.5625, 28.96875, 31.375, 33.78125, 36.1875, 38.59375, 41.0, 43.40625, 45.8125, 48.21875, 50.625, 53.03125, 55.4375, 57.84375, 60.25, 62.65625, 65.0625, 67.46875, 69.875, 72.28125, 74.6875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 6.0, 9.0, 16.0, 21.0, 36.0, 56.0, 114.0, 285.0, 901.0, 1400.0, 730.0, 242.0, 111.0, 57.0, 33.0, 24.0, 12.0, 8.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.40625, -58.69775390625, -56.9892578125, -55.28076171875, -53.572265625, -51.86376953125, -50.1552734375, -48.44677734375, -46.73828125, -45.02978515625, -43.3212890625, -41.61279296875, -39.904296875, -38.19580078125, -36.4873046875, -34.77880859375, -33.0703125, -31.36181640625, -29.6533203125, -27.94482421875, -26.236328125, -24.52783203125, -22.8193359375, -21.11083984375, -19.40234375, -17.69384765625, -15.9853515625, -14.27685546875, -12.568359375, -10.85986328125, -9.1513671875, -7.44287109375, -5.734375, -4.02587890625, -2.3173828125, -0.60888671875, 1.099609375, 2.80810546875, 4.5166015625, 6.22509765625, 7.93359375, 9.64208984375, 11.3505859375, 13.05908203125, 14.767578125, 16.47607421875, 18.1845703125, 19.89306640625, 21.6015625, 23.31005859375, 25.0185546875, 26.72705078125, 28.435546875, 30.14404296875, 31.8525390625, 33.56103515625, 35.26953125, 36.97802734375, 38.6865234375, 40.39501953125, 42.103515625, 43.81201171875, 45.5205078125, 47.22900390625, 48.9375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 13.0, 22.0, 36.0, 37.0, 67.0, 119.0, 151.0, 334.0, 652.0, 1975.0, 8321.0, 61327.0, 3901558.0, 199788.0, 15001.0, 3161.0, 877.0, 354.0, 204.0, 111.0, 69.0, 39.0, 30.0, 15.0, 8.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.75, -61.056640625, -58.36328125, -55.669921875, -52.9765625, -50.283203125, -47.58984375, -44.896484375, -42.203125, -39.509765625, -36.81640625, -34.123046875, -31.4296875, -28.736328125, -26.04296875, -23.349609375, -20.65625, -17.962890625, -15.26953125, -12.576171875, -9.8828125, -7.189453125, -4.49609375, -1.802734375, 0.890625, 3.583984375, 6.27734375, 8.970703125, 11.6640625, 14.357421875, 17.05078125, 19.744140625, 22.4375, 25.130859375, 27.82421875, 30.517578125, 33.2109375, 35.904296875, 38.59765625, 41.291015625, 43.984375, 46.677734375, 49.37109375, 52.064453125, 54.7578125, 57.451171875, 60.14453125, 62.837890625, 65.53125, 68.224609375, 70.91796875, 73.611328125, 76.3046875, 78.998046875, 81.69140625, 84.384765625, 87.078125, 89.771484375, 92.46484375, 95.158203125, 97.8515625, 100.544921875, 103.23828125, 105.931640625, 108.625]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 9.0, 33.0, 330.0, 571.0, 65.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-263.22711181640625, -248.71951293945312, -234.2119140625, -219.70431518554688, -205.1967315673828, -190.6891326904297, -176.18153381347656, -161.6739501953125, -147.16635131835938, -132.65875244140625, -118.15116119384766, -103.64356231689453, -89.13597106933594, -74.62837219238281, -60.12077331542969, -45.613182067871094, -31.105575561523438, -16.597980499267578, -2.090383529663086, 12.417213439941406, 26.924808502197266, 41.432403564453125, 55.94000244140625, 70.44759368896484, 84.95519256591797, 99.4627914428711, 113.97038269042969, 128.4779815673828, 142.98558044433594, 157.4931640625, 172.00076293945312, 186.50836181640625, 201.01596069335938, 215.5235595703125, 230.03115844726562, 244.53875732421875, 259.0463562011719, 273.553955078125, 288.0615234375, 302.5691223144531, 317.07672119140625, 331.5843200683594, 346.0919189453125, 360.5995178222656, 375.10711669921875, 389.61468505859375, 404.122314453125, 418.6298828125, 433.13751220703125, 447.6451110839844, 462.1527099609375, 476.6603088378906, 491.16790771484375, 505.67547607421875, 520.18310546875, 534.690673828125, 549.1982421875, 563.705810546875, 578.2134399414062, 592.7210083007812, 607.2286376953125, 621.7362060546875, 636.2438354492188, 650.7514038085938, 665.259033203125]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 11.0, 8.0, 11.0, 10.0, 15.0, 18.0, 17.0, 25.0, 18.0, 23.0, 22.0, 33.0, 36.0, 44.0, 36.0, 48.0, 41.0, 39.0, 51.0, 33.0, 46.0, 36.0, 39.0, 43.0, 42.0, 45.0, 31.0, 23.0, 25.0, 20.0, 24.0, 10.0, 17.0, 11.0, 12.0, 6.0, 4.0, 5.0, 6.0, 9.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-94.09213256835938, -91.27352905273438, -88.45492553710938, -85.63632202148438, -82.81771850585938, -79.99911499023438, -77.18051147460938, -74.36190795898438, -71.54330444335938, -68.72470092773438, -65.90609741210938, -63.087493896484375, -60.268890380859375, -57.450286865234375, -54.631683349609375, -51.813079833984375, -48.99448013305664, -46.17587661743164, -43.35727310180664, -40.53866958618164, -37.72006607055664, -34.90146255493164, -32.082862854003906, -29.264257431030273, -26.445653915405273, -23.627050399780273, -20.808446884155273, -17.989845275878906, -15.17124080657959, -12.35263729095459, -9.534034729003906, -6.715431213378906, -3.8968276977539062, -1.0782244205474854, 1.7403788566589355, 4.558981895446777, 7.377585411071777, 10.196188926696777, 13.014791488647461, 15.833395004272461, 18.65199851989746, 21.47060203552246, 24.28920555114746, 27.107807159423828, 29.926410675048828, 32.74501419067383, 35.56361770629883, 38.38222122192383, 41.20082473754883, 44.01942825317383, 46.83803176879883, 49.65663528442383, 52.47523880004883, 55.29384231567383, 58.11244201660156, 60.93104553222656, 63.74964904785156, 66.56825256347656, 69.38685607910156, 72.20545959472656, 75.02406311035156, 77.84266662597656, 80.66127014160156, 83.47987365722656, 86.29847717285156]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 9.0, 13.0, 14.0, 26.0, 26.0, 45.0, 55.0, 52.0, 48.0, 68.0, 67.0, 77.0, 72.0, 77.0, 67.0, 68.0, 49.0, 41.0, 34.0, 22.0, 20.0, 12.0, 8.0, 8.0, 5.0, 10.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.3515625, -14.91015625, -14.46875, -14.02734375, -13.5859375, -13.14453125, -12.703125, -12.26171875, -11.8203125, -11.37890625, -10.9375, -10.49609375, -10.0546875, -9.61328125, -9.171875, -8.73046875, -8.2890625, -7.84765625, -7.40625, -6.96484375, -6.5234375, -6.08203125, -5.640625, -5.19921875, -4.7578125, -4.31640625, -3.875, -3.43359375, -2.9921875, -2.55078125, -2.109375, -1.66796875, -1.2265625, -0.78515625, -0.34375, 0.09765625, 0.5390625, 0.98046875, 1.421875, 1.86328125, 2.3046875, 2.74609375, 3.1875, 3.62890625, 4.0703125, 4.51171875, 4.953125, 5.39453125, 5.8359375, 6.27734375, 6.71875, 7.16015625, 7.6015625, 8.04296875, 8.484375, 8.92578125, 9.3671875, 9.80859375, 10.25, 10.69140625, 11.1328125, 11.57421875, 12.015625, 12.45703125, 12.8984375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 2.0, 4.0, 7.0, 4.0, 6.0, 12.0, 15.0, 18.0, 20.0, 31.0, 48.0, 70.0, 109.0, 141.0, 233.0, 414.0, 654.0, 1190.0, 2090.0, 3967.0, 8118.0, 16897.0, 36200.0, 84163.0, 236774.0, 399832.0, 148439.0, 57855.0, 25820.0, 12408.0, 6067.0, 2998.0, 1563.0, 940.0, 544.0, 304.0, 197.0, 123.0, 79.0, 51.0, 38.0, 25.0, 21.0, 15.0, 16.0, 13.0, 9.0, 7.0, 7.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.263671875, -1.2232818603515625, -1.182891845703125, -1.1425018310546875, -1.10211181640625, -1.0617218017578125, -1.021331787109375, -0.9809417724609375, -0.9405517578125, -0.9001617431640625, -0.859771728515625, -0.8193817138671875, -0.77899169921875, -0.7386016845703125, -0.698211669921875, -0.6578216552734375, -0.617431640625, -0.5770416259765625, -0.536651611328125, -0.4962615966796875, -0.45587158203125, -0.4154815673828125, -0.375091552734375, -0.3347015380859375, -0.2943115234375, -0.2539215087890625, -0.213531494140625, -0.1731414794921875, -0.13275146484375, -0.0923614501953125, -0.051971435546875, -0.0115814208984375, 0.02880859375, 0.0691986083984375, 0.109588623046875, 0.1499786376953125, 0.19036865234375, 0.2307586669921875, 0.271148681640625, 0.3115386962890625, 0.3519287109375, 0.3923187255859375, 0.432708740234375, 0.4730987548828125, 0.51348876953125, 0.5538787841796875, 0.594268798828125, 0.6346588134765625, 0.675048828125, 0.7154388427734375, 0.755828857421875, 0.7962188720703125, 0.83660888671875, 0.8769989013671875, 0.917388916015625, 0.9577789306640625, 0.9981689453125, 1.0385589599609375, 1.078948974609375, 1.1193389892578125, 1.15972900390625, 1.2001190185546875, 1.240509033203125, 1.2808990478515625, 1.3212890625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 6.0, 8.0, 9.0, 6.0, 10.0, 4.0, 16.0, 17.0, 28.0, 35.0, 40.0, 34.0, 34.0, 31.0, 46.0, 35.0, 48.0, 36.0, 41.0, 1070.0, 37.0, 42.0, 39.0, 36.0, 41.0, 26.0, 36.0, 30.0, 29.0, 20.0, 28.0, 24.0, 13.0, 11.0, 11.0, 11.0, 5.0, 6.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.9609375, -5.7813720703125, -5.601806640625, -5.4222412109375, -5.24267578125, -5.0631103515625, -4.883544921875, -4.7039794921875, -4.5244140625, -4.3448486328125, -4.165283203125, -3.9857177734375, -3.80615234375, -3.6265869140625, -3.447021484375, -3.2674560546875, -3.087890625, -2.9083251953125, -2.728759765625, -2.5491943359375, -2.36962890625, -2.1900634765625, -2.010498046875, -1.8309326171875, -1.6513671875, -1.4718017578125, -1.292236328125, -1.1126708984375, -0.93310546875, -0.7535400390625, -0.573974609375, -0.3944091796875, -0.21484375, -0.0352783203125, 0.144287109375, 0.3238525390625, 0.50341796875, 0.6829833984375, 0.862548828125, 1.0421142578125, 1.2216796875, 1.4012451171875, 1.580810546875, 1.7603759765625, 1.93994140625, 2.1195068359375, 2.299072265625, 2.4786376953125, 2.658203125, 2.8377685546875, 3.017333984375, 3.1968994140625, 3.37646484375, 3.5560302734375, 3.735595703125, 3.9151611328125, 4.0947265625, 4.2742919921875, 4.453857421875, 4.6334228515625, 4.81298828125, 4.9925537109375, 5.172119140625, 5.3516845703125, 5.53125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 9.0, 14.0, 15.0, 21.0, 23.0, 53.0, 63.0, 99.0, 150.0, 240.0, 379.0, 578.0, 937.0, 1504.0, 2568.0, 4197.0, 7400.0, 13109.0, 22460.0, 42068.0, 79999.0, 169687.0, 1368914.0, 190859.0, 87425.0, 45478.0, 24798.0, 14308.0, 8046.0, 4623.0, 2781.0, 1629.0, 998.0, 617.0, 382.0, 247.0, 156.0, 100.0, 59.0, 43.0, 32.0, 22.0, 11.0, 15.0, 8.0, 2.0, 1.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.96630859375, -0.9366378784179688, -0.9069671630859375, -0.8772964477539062, -0.847625732421875, -0.8179550170898438, -0.7882843017578125, -0.7586135864257812, -0.72894287109375, -0.6992721557617188, -0.6696014404296875, -0.6399307250976562, -0.610260009765625, -0.5805892944335938, -0.5509185791015625, -0.5212478637695312, -0.4915771484375, -0.46190643310546875, -0.4322357177734375, -0.40256500244140625, -0.372894287109375, -0.34322357177734375, -0.3135528564453125, -0.28388214111328125, -0.25421142578125, -0.22454071044921875, -0.1948699951171875, -0.16519927978515625, -0.135528564453125, -0.10585784912109375, -0.0761871337890625, -0.04651641845703125, -0.016845703125, 0.01282501220703125, 0.0424957275390625, 0.07216644287109375, 0.101837158203125, 0.13150787353515625, 0.1611785888671875, 0.19084930419921875, 0.22052001953125, 0.25019073486328125, 0.2798614501953125, 0.30953216552734375, 0.339202880859375, 0.36887359619140625, 0.3985443115234375, 0.42821502685546875, 0.4578857421875, 0.48755645751953125, 0.5172271728515625, 0.5468978881835938, 0.576568603515625, 0.6062393188476562, 0.6359100341796875, 0.6655807495117188, 0.69525146484375, 0.7249221801757812, 0.7545928955078125, 0.7842636108398438, 0.813934326171875, 0.8436050415039062, 0.8732757568359375, 0.9029464721679688, 0.9326171875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 4.0, 4.0, 4.0, 7.0, 18.0, 11.0, 18.0, 19.0, 30.0, 42.0, 28.0, 52.0, 37.0, 58.0, 60.0, 49.0, 66.0, 78.0, 60.0, 54.0, 39.0, 56.0, 44.0, 21.0, 31.0, 19.0, 20.0, 15.0, 8.0, 11.0, 8.0, 8.0, 8.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.002407073974609375, -0.002341940999031067, -0.002276808023452759, -0.0022116750478744507, -0.0021465420722961426, -0.0020814090967178345, -0.0020162761211395264, -0.0019511431455612183, -0.0018860101699829102, -0.001820877194404602, -0.001755744218826294, -0.0016906112432479858, -0.0016254782676696777, -0.0015603452920913696, -0.0014952123165130615, -0.0014300793409347534, -0.0013649463653564453, -0.0012998133897781372, -0.001234680414199829, -0.001169547438621521, -0.0011044144630432129, -0.0010392814874649048, -0.0009741485118865967, -0.0009090155363082886, -0.0008438825607299805, -0.0007787495851516724, -0.0007136166095733643, -0.0006484836339950562, -0.000583350658416748, -0.0005182176828384399, -0.00045308470726013184, -0.00038795173168182373, -0.0003228187561035156, -0.0002576857805252075, -0.00019255280494689941, -0.0001274198293685913, -6.22868537902832e-05, 2.8461217880249023e-06, 6.797909736633301e-05, 0.0001331120729446411, 0.00019824504852294922, 0.0002633780241012573, 0.00032851099967956543, 0.00039364397525787354, 0.00045877695083618164, 0.0005239099264144897, 0.0005890429019927979, 0.000654175877571106, 0.0007193088531494141, 0.0007844418287277222, 0.0008495748043060303, 0.0009147077798843384, 0.0009798407554626465, 0.0010449737310409546, 0.0011101067066192627, 0.0011752396821975708, 0.001240372657775879, 0.001305505633354187, 0.0013706386089324951, 0.0014357715845108032, 0.0015009045600891113, 0.0015660375356674194, 0.0016311705112457275, 0.0016963034868240356, 0.0017614364624023438]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 4.0, 2.0, 8.0, 3.0, 7.0, 10.0, 18.0, 17.0, 21.0, 37.0, 33.0, 39.0, 60.0, 78.0, 81.0, 147.0, 154.0, 248.0, 384.0, 1059.0, 192536.0, 850288.0, 1867.0, 448.0, 202.0, 160.0, 158.0, 103.0, 96.0, 60.0, 50.0, 42.0, 26.0, 30.0, 20.0, 16.0, 10.0, 8.0, 5.0, 11.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03265380859375, -0.0314488410949707, -0.030243873596191406, -0.02903890609741211, -0.027833938598632812, -0.026628971099853516, -0.02542400360107422, -0.024219036102294922, -0.023014068603515625, -0.021809101104736328, -0.02060413360595703, -0.019399166107177734, -0.018194198608398438, -0.01698923110961914, -0.015784263610839844, -0.014579296112060547, -0.01337432861328125, -0.012169361114501953, -0.010964393615722656, -0.00975942611694336, -0.008554458618164062, -0.007349491119384766, -0.006144523620605469, -0.004939556121826172, -0.003734588623046875, -0.002529621124267578, -0.0013246536254882812, -0.00011968612670898438, 0.0010852813720703125, 0.0022902488708496094, 0.0034952163696289062, 0.004700183868408203, 0.0059051513671875, 0.007110118865966797, 0.008315086364746094, 0.00952005386352539, 0.010725021362304688, 0.011929988861083984, 0.013134956359863281, 0.014339923858642578, 0.015544891357421875, 0.016749858856201172, 0.01795482635498047, 0.019159793853759766, 0.020364761352539062, 0.02156972885131836, 0.022774696350097656, 0.023979663848876953, 0.02518463134765625, 0.026389598846435547, 0.027594566345214844, 0.02879953384399414, 0.030004501342773438, 0.031209468841552734, 0.03241443634033203, 0.03361940383911133, 0.034824371337890625, 0.03602933883666992, 0.03723430633544922, 0.038439273834228516, 0.03964424133300781, 0.04084920883178711, 0.042054176330566406, 0.0432591438293457, 0.044464111328125]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 44.0, 772.0, 195.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012429500930011272, -0.01215170044451952, -0.011873899027705193, -0.01159609854221344, -0.011318297125399113, -0.01104049663990736, -0.010762695223093033, -0.01048489473760128, -0.010207094252109528, -0.009929293766617775, -0.009651492349803448, -0.009373691864311695, -0.009095890447497368, -0.008818089962005615, -0.008540289476513863, -0.008262488059699535, -0.007984686642885208, -0.007706885691732168, -0.007429084740579128, -0.007151284255087376, -0.006873483303934336, -0.006595682352781296, -0.006317881401628256, -0.006040080450475216, -0.005762279964983463, -0.005484479013830423, -0.005206678062677383, -0.004928877577185631, -0.004651076626032591, -0.004373275674879551, -0.004095474723726511, -0.003817673772573471, -0.0035398732870817184, -0.0032620723359286785, -0.0029842716176062822, -0.0027064706664532423, -0.002428669948130846, -0.002150868996977806, -0.0018730680458247662, -0.001595267211087048, -0.00131746637634933, -0.0010396655416116118, -0.0007618646486662328, -0.0004840637557208538, -0.0002062629209831357, 7.15379137545824e-05, 0.00034933886490762234, 0.0006271396996453404, 0.0009049405343830585, 0.0011827413691207767, 0.0014605422038584948, 0.0017383431550115347, 0.002016143873333931, 0.002293944824486971, 0.002571745775640011, 0.0028495467267930508, 0.003127347445115447, 0.003405148396268487, 0.0036829491145908833, 0.003960750065743923, 0.004238551016896963, 0.004516351968050003, 0.004794152453541756, 0.005071953404694796, 0.0053497543558478355]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 7.0, 6.0, 7.0, 12.0, 9.0, 13.0, 18.0, 20.0, 22.0, 34.0, 30.0, 37.0, 39.0, 32.0, 53.0, 45.0, 38.0, 39.0, 36.0, 45.0, 50.0, 42.0, 48.0, 49.0, 37.0, 29.0, 33.0, 24.0, 21.0, 22.0, 25.0, 15.0, 17.0, 12.0, 12.0, 3.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0012550950050354004, -0.0012208754196763039, -0.0011866558343172073, -0.0011524362489581108, -0.0011182166635990143, -0.0010839970782399178, -0.0010497774928808212, -0.0010155579075217247, -0.0009813383221626282, -0.0009471187368035316, -0.0009128991514444351, -0.0008786795660853386, -0.0008444599807262421, -0.0008102403953671455, -0.000776020810008049, -0.0007418012246489525, -0.000707581639289856, -0.0006733620539307594, -0.0006391424685716629, -0.0006049228832125664, -0.0005707032978534698, -0.0005364837124943733, -0.0005022641271352768, -0.00046804454177618027, -0.00043382495641708374, -0.0003996053710579872, -0.0003653857856988907, -0.00033116620033979416, -0.00029694661498069763, -0.0002627270296216011, -0.00022850744426250458, -0.00019428785890340805, -0.00016006827354431152, -0.000125848688185215, -9.162910282611847e-05, -5.740951746702194e-05, -2.3189932107925415e-05, 1.1029653251171112e-05, 4.524923861026764e-05, 7.946882396936417e-05, 0.0001136884093284607, 0.00014790799468755722, 0.00018212758004665375, 0.00021634716540575027, 0.0002505667507648468, 0.00028478633612394333, 0.00031900592148303986, 0.0003532255068421364, 0.0003874450922012329, 0.00042166467756032944, 0.00045588426291942596, 0.0004901038482785225, 0.000524323433637619, 0.0005585430189967155, 0.0005927626043558121, 0.0006269821897149086, 0.0006612017750740051, 0.0006954213604331017, 0.0007296409457921982, 0.0007638605311512947, 0.0007980801165103912, 0.0008322997018694878, 0.0008665192872285843, 0.0009007388725876808, 0.0009349584579467773]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 9.0, 13.0, 14.0, 26.0, 26.0, 45.0, 55.0, 52.0, 48.0, 68.0, 67.0, 77.0, 72.0, 77.0, 67.0, 68.0, 49.0, 41.0, 34.0, 22.0, 20.0, 12.0, 8.0, 8.0, 5.0, 10.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.3515625, -14.91015625, -14.46875, -14.02734375, -13.5859375, -13.14453125, -12.703125, -12.26171875, -11.8203125, -11.37890625, -10.9375, -10.49609375, -10.0546875, -9.61328125, -9.171875, -8.73046875, -8.2890625, -7.84765625, -7.40625, -6.96484375, -6.5234375, -6.08203125, -5.640625, -5.19921875, -4.7578125, -4.31640625, -3.875, -3.43359375, -2.9921875, -2.55078125, -2.109375, -1.66796875, -1.2265625, -0.78515625, -0.34375, 0.09765625, 0.5390625, 0.98046875, 1.421875, 1.86328125, 2.3046875, 2.74609375, 3.1875, 3.62890625, 4.0703125, 4.51171875, 4.953125, 5.39453125, 5.8359375, 6.27734375, 6.71875, 7.16015625, 7.6015625, 8.04296875, 8.484375, 8.92578125, 9.3671875, 9.80859375, 10.25, 10.69140625, 11.1328125, 11.57421875, 12.015625, 12.45703125, 12.8984375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 4.0, 3.0, 4.0, 8.0, 12.0, 15.0, 23.0, 42.0, 37.0, 99.0, 150.0, 234.0, 413.0, 806.0, 1664.0, 4573.0, 18629.0, 151634.0, 760275.0, 90137.0, 13187.0, 3610.0, 1387.0, 674.0, 342.0, 227.0, 127.0, 80.0, 60.0, 31.0, 23.0, 18.0, 8.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.1328125, -13.7095947265625, -13.286376953125, -12.8631591796875, -12.43994140625, -12.0167236328125, -11.593505859375, -11.1702880859375, -10.7470703125, -10.3238525390625, -9.900634765625, -9.4774169921875, -9.05419921875, -8.6309814453125, -8.207763671875, -7.7845458984375, -7.361328125, -6.9381103515625, -6.514892578125, -6.0916748046875, -5.66845703125, -5.2452392578125, -4.822021484375, -4.3988037109375, -3.9755859375, -3.5523681640625, -3.129150390625, -2.7059326171875, -2.28271484375, -1.8594970703125, -1.436279296875, -1.0130615234375, -0.58984375, -0.1666259765625, 0.256591796875, 0.6798095703125, 1.10302734375, 1.5262451171875, 1.949462890625, 2.3726806640625, 2.7958984375, 3.2191162109375, 3.642333984375, 4.0655517578125, 4.48876953125, 4.9119873046875, 5.335205078125, 5.7584228515625, 6.181640625, 6.6048583984375, 7.028076171875, 7.4512939453125, 7.87451171875, 8.2977294921875, 8.720947265625, 9.1441650390625, 9.5673828125, 9.9906005859375, 10.413818359375, 10.8370361328125, 11.26025390625, 11.6834716796875, 12.106689453125, 12.5299072265625, 12.953125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 7.0, 5.0, 3.0, 9.0, 7.0, 10.0, 18.0, 18.0, 19.0, 18.0, 23.0, 23.0, 20.0, 24.0, 33.0, 34.0, 33.0, 40.0, 42.0, 43.0, 42.0, 190.0, 1888.0, 89.0, 48.0, 29.0, 35.0, 37.0, 33.0, 34.0, 23.0, 21.0, 20.0, 27.0, 9.0, 20.0, 15.0, 17.0, 8.0, 8.0, 11.0, 7.0, 9.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.984375, -28.058837890625, -27.13330078125, -26.207763671875, -25.2822265625, -24.356689453125, -23.43115234375, -22.505615234375, -21.580078125, -20.654541015625, -19.72900390625, -18.803466796875, -17.8779296875, -16.952392578125, -16.02685546875, -15.101318359375, -14.17578125, -13.250244140625, -12.32470703125, -11.399169921875, -10.4736328125, -9.548095703125, -8.62255859375, -7.697021484375, -6.771484375, -5.845947265625, -4.92041015625, -3.994873046875, -3.0693359375, -2.143798828125, -1.21826171875, -0.292724609375, 0.6328125, 1.558349609375, 2.48388671875, 3.409423828125, 4.3349609375, 5.260498046875, 6.18603515625, 7.111572265625, 8.037109375, 8.962646484375, 9.88818359375, 10.813720703125, 11.7392578125, 12.664794921875, 13.59033203125, 14.515869140625, 15.44140625, 16.366943359375, 17.29248046875, 18.218017578125, 19.1435546875, 20.069091796875, 20.99462890625, 21.920166015625, 22.845703125, 23.771240234375, 24.69677734375, 25.622314453125, 26.5478515625, 27.473388671875, 28.39892578125, 29.324462890625, 30.25]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 9.0, 10.0, 7.0, 9.0, 8.0, 19.0, 17.0, 16.0, 19.0, 25.0, 24.0, 28.0, 43.0, 50.0, 76.0, 91.0, 164.0, 386.0, 1082.0, 76512.0, 3063612.0, 2129.0, 578.0, 222.0, 130.0, 91.0, 57.0, 48.0, 41.0, 21.0, 30.0, 18.0, 25.0, 21.0, 16.0, 19.0, 12.0, 8.0, 8.0, 5.0, 3.0, 8.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-69.5, -67.3408203125, -65.181640625, -63.0224609375, -60.86328125, -58.7041015625, -56.544921875, -54.3857421875, -52.2265625, -50.0673828125, -47.908203125, -45.7490234375, -43.58984375, -41.4306640625, -39.271484375, -37.1123046875, -34.953125, -32.7939453125, -30.634765625, -28.4755859375, -26.31640625, -24.1572265625, -21.998046875, -19.8388671875, -17.6796875, -15.5205078125, -13.361328125, -11.2021484375, -9.04296875, -6.8837890625, -4.724609375, -2.5654296875, -0.40625, 1.7529296875, 3.912109375, 6.0712890625, 8.23046875, 10.3896484375, 12.548828125, 14.7080078125, 16.8671875, 19.0263671875, 21.185546875, 23.3447265625, 25.50390625, 27.6630859375, 29.822265625, 31.9814453125, 34.140625, 36.2998046875, 38.458984375, 40.6181640625, 42.77734375, 44.9365234375, 47.095703125, 49.2548828125, 51.4140625, 53.5732421875, 55.732421875, 57.8916015625, 60.05078125, 62.2099609375, 64.369140625, 66.5283203125, 68.6875]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 49.0, 680.0, 283.0, 6.0], "bins": [-212.4017333984375, -208.96383666992188, -205.52593994140625, -202.08804321289062, -198.650146484375, -195.21224975585938, -191.7743682861328, -188.3364715576172, -184.89857482910156, -181.46067810058594, -178.0227813720703, -174.5848846435547, -171.14698791503906, -167.7091064453125, -164.27120971679688, -160.83331298828125, -157.39541625976562, -153.95751953125, -150.51962280273438, -147.08172607421875, -143.64382934570312, -140.2059326171875, -136.76805114746094, -133.3301544189453, -129.8922576904297, -126.45436096191406, -123.01646423339844, -119.57857513427734, -116.14067840576172, -112.7027816772461, -109.26488494873047, -105.82699584960938, -102.38909912109375, -98.95120239257812, -95.5133056640625, -92.0754165649414, -88.63751983642578, -85.19962310791016, -81.76172637939453, -78.32383728027344, -74.88593292236328, -71.44803619384766, -68.01013946533203, -64.57225036621094, -61.13435363769531, -57.69645690917969, -54.25856018066406, -50.8206672668457, -47.382774353027344, -43.94487762451172, -40.50698471069336, -37.069087982177734, -33.631195068359375, -30.19329833984375, -26.755403518676758, -23.317508697509766, -19.879613876342773, -16.44171905517578, -13.003824234008789, -9.56592845916748, -6.128033638000488, -2.6901378631591797, 0.7477569580078125, 4.185651779174805, 7.623546123504639]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 8.0, 4.0, 2.0, 4.0, 12.0, 8.0, 13.0, 6.0, 10.0, 20.0, 22.0, 27.0, 17.0, 32.0, 26.0, 35.0, 39.0, 36.0, 38.0, 35.0, 49.0, 41.0, 33.0, 40.0, 42.0, 44.0, 37.0, 30.0, 33.0, 35.0, 29.0, 32.0, 32.0, 24.0, 17.0, 15.0, 9.0, 9.0, 13.0, 8.0, 11.0, 8.0, 3.0, 3.0, 4.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.19054412841797, -95.18575286865234, -92.18096923828125, -89.17617797851562, -86.17139434814453, -83.1666030883789, -80.16181945800781, -77.15702819824219, -74.15223693847656, -71.14744567871094, -68.14266204833984, -65.13787078857422, -62.13308334350586, -59.1282958984375, -56.12350845336914, -53.11872100830078, -50.11393356323242, -47.10914611816406, -44.1043586730957, -41.099571228027344, -38.09477996826172, -35.08999252319336, -32.085205078125, -29.080415725708008, -26.07562828063965, -23.07084083557129, -20.066051483154297, -17.061264038085938, -14.056475639343262, -11.051687240600586, -8.046899795532227, -5.042110443115234, -2.037322998046875, 0.9674651622772217, 3.9722533226013184, 6.977041244506836, 9.981829643249512, 12.986618041992188, 15.991405487060547, 18.99619483947754, 22.0009822845459, 25.005769729614258, 28.01055908203125, 31.01534652709961, 34.02013397216797, 37.024925231933594, 40.02970886230469, 43.03450012207031, 46.03928756713867, 49.04407501220703, 52.04886245727539, 55.05364990234375, 58.058441162109375, 61.063228607177734, 64.0680160522461, 67.07280731201172, 70.07759094238281, 73.08238220214844, 76.08716583251953, 79.09195709228516, 82.09674072265625, 85.10153198242188, 88.1063232421875, 91.1111068725586, 94.11589813232422]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 12.0, 11.0, 18.0, 20.0, 33.0, 41.0, 43.0, 56.0, 48.0, 69.0, 59.0, 83.0, 73.0, 69.0, 73.0, 62.0, 59.0, 32.0, 39.0, 22.0, 19.0, 20.0, 9.0, 7.0, 4.0, 10.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.3984375, -14.9573974609375, -14.516357421875, -14.0753173828125, -13.63427734375, -13.1932373046875, -12.752197265625, -12.3111572265625, -11.8701171875, -11.4290771484375, -10.988037109375, -10.5469970703125, -10.10595703125, -9.6649169921875, -9.223876953125, -8.7828369140625, -8.341796875, -7.9007568359375, -7.459716796875, -7.0186767578125, -6.57763671875, -6.1365966796875, -5.695556640625, -5.2545166015625, -4.8134765625, -4.3724365234375, -3.931396484375, -3.4903564453125, -3.04931640625, -2.6082763671875, -2.167236328125, -1.7261962890625, -1.28515625, -0.8441162109375, -0.403076171875, 0.0379638671875, 0.47900390625, 0.9200439453125, 1.361083984375, 1.8021240234375, 2.2431640625, 2.6842041015625, 3.125244140625, 3.5662841796875, 4.00732421875, 4.4483642578125, 4.889404296875, 5.3304443359375, 5.771484375, 6.2125244140625, 6.653564453125, 7.0946044921875, 7.53564453125, 7.9766845703125, 8.417724609375, 8.8587646484375, 9.2998046875, 9.7408447265625, 10.181884765625, 10.6229248046875, 11.06396484375, 11.5050048828125, 11.946044921875, 12.3870849609375, 12.828125]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 13.0, 20.0, 19.0, 30.0, 49.0, 67.0, 122.0, 262.0, 703.0, 3627.0, 875043.0, 3308027.0, 4876.0, 842.0, 248.0, 120.0, 74.0, 36.0, 35.0, 19.0, 18.0, 10.0, 4.0, 6.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.5625, -113.3310546875, -110.099609375, -106.8681640625, -103.63671875, -100.4052734375, -97.173828125, -93.9423828125, -90.7109375, -87.4794921875, -84.248046875, -81.0166015625, -77.78515625, -74.5537109375, -71.322265625, -68.0908203125, -64.859375, -61.6279296875, -58.396484375, -55.1650390625, -51.93359375, -48.7021484375, -45.470703125, -42.2392578125, -39.0078125, -35.7763671875, -32.544921875, -29.3134765625, -26.08203125, -22.8505859375, -19.619140625, -16.3876953125, -13.15625, -9.9248046875, -6.693359375, -3.4619140625, -0.23046875, 3.0009765625, 6.232421875, 9.4638671875, 12.6953125, 15.9267578125, 19.158203125, 22.3896484375, 25.62109375, 28.8525390625, 32.083984375, 35.3154296875, 38.546875, 41.7783203125, 45.009765625, 48.2412109375, 51.47265625, 54.7041015625, 57.935546875, 61.1669921875, 64.3984375, 67.6298828125, 70.861328125, 74.0927734375, 77.32421875, 80.5556640625, 83.787109375, 87.0185546875, 90.25]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 1.0, 12.0, 14.0, 14.0, 16.0, 30.0, 33.0, 71.0, 141.0, 349.0, 728.0, 1038.0, 821.0, 405.0, 160.0, 92.0, 42.0, 26.0, 24.0, 12.0, 6.0, 10.0, 11.0, 1.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.296875, -26.087158203125, -24.87744140625, -23.667724609375, -22.4580078125, -21.248291015625, -20.03857421875, -18.828857421875, -17.619140625, -16.409423828125, -15.19970703125, -13.989990234375, -12.7802734375, -11.570556640625, -10.36083984375, -9.151123046875, -7.94140625, -6.731689453125, -5.52197265625, -4.312255859375, -3.1025390625, -1.892822265625, -0.68310546875, 0.526611328125, 1.736328125, 2.946044921875, 4.15576171875, 5.365478515625, 6.5751953125, 7.784912109375, 8.99462890625, 10.204345703125, 11.4140625, 12.623779296875, 13.83349609375, 15.043212890625, 16.2529296875, 17.462646484375, 18.67236328125, 19.882080078125, 21.091796875, 22.301513671875, 23.51123046875, 24.720947265625, 25.9306640625, 27.140380859375, 28.35009765625, 29.559814453125, 30.76953125, 31.979248046875, 33.18896484375, 34.398681640625, 35.6083984375, 36.818115234375, 38.02783203125, 39.237548828125, 40.447265625, 41.656982421875, 42.86669921875, 44.076416015625, 45.2861328125, 46.495849609375, 47.70556640625, 48.915283203125, 50.125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 4.0, 7.0, 12.0, 15.0, 21.0, 31.0, 46.0, 75.0, 138.0, 210.0, 414.0, 790.0, 1459.0, 3106.0, 8096.0, 25337.0, 199978.0, 3702251.0, 211896.0, 25839.0, 8046.0, 3243.0, 1500.0, 758.0, 418.0, 232.0, 129.0, 69.0, 50.0, 30.0, 20.0, 19.0, 11.0, 14.0, 7.0, 4.0, 8.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-56.9375, -55.333984375, -53.73046875, -52.126953125, -50.5234375, -48.919921875, -47.31640625, -45.712890625, -44.109375, -42.505859375, -40.90234375, -39.298828125, -37.6953125, -36.091796875, -34.48828125, -32.884765625, -31.28125, -29.677734375, -28.07421875, -26.470703125, -24.8671875, -23.263671875, -21.66015625, -20.056640625, -18.453125, -16.849609375, -15.24609375, -13.642578125, -12.0390625, -10.435546875, -8.83203125, -7.228515625, -5.625, -4.021484375, -2.41796875, -0.814453125, 0.7890625, 2.392578125, 3.99609375, 5.599609375, 7.203125, 8.806640625, 10.41015625, 12.013671875, 13.6171875, 15.220703125, 16.82421875, 18.427734375, 20.03125, 21.634765625, 23.23828125, 24.841796875, 26.4453125, 28.048828125, 29.65234375, 31.255859375, 32.859375, 34.462890625, 36.06640625, 37.669921875, 39.2734375, 40.876953125, 42.48046875, 44.083984375, 45.6875]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 17.0, 43.0, 166.0, 357.0, 269.0, 95.0, 31.0, 14.0, 7.0, 3.0, 3.0], "bins": [-399.72552490234375, -392.69146728515625, -385.65740966796875, -378.6233215332031, -371.5892639160156, -364.5552062988281, -357.5211486816406, -350.487060546875, -343.4530029296875, -336.4189453125, -329.3848876953125, -322.3507995605469, -315.3167419433594, -308.2826843261719, -301.2486267089844, -294.21453857421875, -287.18048095703125, -280.14642333984375, -273.11236572265625, -266.0782775878906, -259.0442199707031, -252.01016235351562, -244.97610473632812, -237.94203186035156, -230.90798950195312, -223.87393188476562, -216.83985900878906, -209.80580139160156, -202.771728515625, -195.7376708984375, -188.70361328125, -181.66954040527344, -174.63548278808594, -167.60142517089844, -160.56735229492188, -153.53329467773438, -146.4992218017578, -139.4651641845703, -132.43109130859375, -125.39703369140625, -118.36296844482422, -111.32890319824219, -104.29483795166016, -97.26077270507812, -90.22671508789062, -83.19264221191406, -76.15858459472656, -69.12451934814453, -62.0904541015625, -55.05638885498047, -48.02232360839844, -40.98826217651367, -33.95419692993164, -26.92013168334961, -19.886070251464844, -12.852005004882812, -5.817939758300781, 1.2161245346069336, 8.250188827514648, 15.284252166748047, 22.318317413330078, 29.35238265991211, 36.386444091796875, 43.420509338378906, 50.45457458496094]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 3.0, 4.0, 8.0, 2.0, 3.0, 10.0, 14.0, 12.0, 15.0, 25.0, 16.0, 21.0, 18.0, 19.0, 24.0, 41.0, 25.0, 27.0, 42.0, 39.0, 45.0, 40.0, 44.0, 58.0, 37.0, 47.0, 43.0, 35.0, 35.0, 25.0, 33.0, 35.0, 18.0, 16.0, 18.0, 20.0, 18.0, 15.0, 5.0, 9.0, 7.0, 7.0, 5.0, 5.0, 3.0, 3.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-75.62722778320312, -73.33653259277344, -71.04582977294922, -68.75513458251953, -66.46443176269531, -64.17373657226562, -61.88304138183594, -59.592342376708984, -57.30164337158203, -55.01094436645508, -52.720245361328125, -50.42955017089844, -48.138851165771484, -45.84815216064453, -43.557456970214844, -41.26675796508789, -38.97605895996094, -36.685359954833984, -34.39466094970703, -32.103965759277344, -29.81326675415039, -27.522567749023438, -25.231870651245117, -22.941173553466797, -20.650474548339844, -18.35977554321289, -16.06907844543457, -13.778380393981934, -11.487682342529297, -9.19698429107666, -6.906286239624023, -4.615589141845703, -2.3248977661132812, -0.03419971466064453, 2.256498336791992, 4.547196388244629, 6.837894439697266, 9.128592491149902, 11.419290542602539, 13.70998764038086, 16.000686645507812, 18.291385650634766, 20.582082748413086, 22.872779846191406, 25.16347885131836, 27.454177856445312, 29.744874954223633, 32.03557205200195, 34.326271057128906, 36.61697006225586, 38.90766906738281, 41.1983642578125, 43.48906326293945, 45.779762268066406, 48.070457458496094, 50.36115646362305, 52.65185546875, 54.94255447387695, 57.233253479003906, 59.523948669433594, 61.81464767456055, 64.1053466796875, 66.39604187011719, 68.68673706054688, 70.9774398803711]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 6.0, 6.0, 10.0, 7.0, 21.0, 31.0, 30.0, 35.0, 41.0, 46.0, 51.0, 51.0, 66.0, 72.0, 64.0, 72.0, 60.0, 53.0, 68.0, 54.0, 32.0, 27.0, 21.0, 18.0, 18.0, 16.0, 8.0, 6.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.078125, -13.642822265625, -13.20751953125, -12.772216796875, -12.3369140625, -11.901611328125, -11.46630859375, -11.031005859375, -10.595703125, -10.160400390625, -9.72509765625, -9.289794921875, -8.8544921875, -8.419189453125, -7.98388671875, -7.548583984375, -7.11328125, -6.677978515625, -6.24267578125, -5.807373046875, -5.3720703125, -4.936767578125, -4.50146484375, -4.066162109375, -3.630859375, -3.195556640625, -2.76025390625, -2.324951171875, -1.8896484375, -1.454345703125, -1.01904296875, -0.583740234375, -0.1484375, 0.286865234375, 0.72216796875, 1.157470703125, 1.5927734375, 2.028076171875, 2.46337890625, 2.898681640625, 3.333984375, 3.769287109375, 4.20458984375, 4.639892578125, 5.0751953125, 5.510498046875, 5.94580078125, 6.381103515625, 6.81640625, 7.251708984375, 7.68701171875, 8.122314453125, 8.5576171875, 8.992919921875, 9.42822265625, 9.863525390625, 10.298828125, 10.734130859375, 11.16943359375, 11.604736328125, 12.0400390625, 12.475341796875, 12.91064453125, 13.345947265625, 13.78125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 9.0, 14.0, 19.0, 16.0, 35.0, 53.0, 63.0, 103.0, 158.0, 259.0, 380.0, 623.0, 1014.0, 1704.0, 3059.0, 5532.0, 10534.0, 21313.0, 44100.0, 100179.0, 253779.0, 345809.0, 141274.0, 60415.0, 28055.0, 13775.0, 6908.0, 3879.0, 2135.0, 1268.0, 744.0, 478.0, 277.0, 197.0, 130.0, 81.0, 51.0, 30.0, 21.0, 20.0, 11.0, 14.0, 11.0, 5.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1845703125, -1.1453399658203125, -1.106109619140625, -1.0668792724609375, -1.02764892578125, -0.9884185791015625, -0.949188232421875, -0.9099578857421875, -0.8707275390625, -0.8314971923828125, -0.792266845703125, -0.7530364990234375, -0.71380615234375, -0.6745758056640625, -0.635345458984375, -0.5961151123046875, -0.556884765625, -0.5176544189453125, -0.478424072265625, -0.4391937255859375, -0.39996337890625, -0.3607330322265625, -0.321502685546875, -0.2822723388671875, -0.2430419921875, -0.2038116455078125, -0.164581298828125, -0.1253509521484375, -0.08612060546875, -0.0468902587890625, -0.007659912109375, 0.0315704345703125, 0.07080078125, 0.1100311279296875, 0.149261474609375, 0.1884918212890625, 0.22772216796875, 0.2669525146484375, 0.306182861328125, 0.3454132080078125, 0.3846435546875, 0.4238739013671875, 0.463104248046875, 0.5023345947265625, 0.54156494140625, 0.5807952880859375, 0.620025634765625, 0.6592559814453125, 0.698486328125, 0.7377166748046875, 0.776947021484375, 0.8161773681640625, 0.85540771484375, 0.8946380615234375, 0.933868408203125, 0.9730987548828125, 1.0123291015625, 1.0515594482421875, 1.090789794921875, 1.1300201416015625, 1.16925048828125, 1.2084808349609375, 1.247711181640625, 1.2869415283203125, 1.326171875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 8.0, 10.0, 12.0, 20.0, 9.0, 11.0, 12.0, 25.0, 27.0, 22.0, 26.0, 32.0, 32.0, 38.0, 29.0, 39.0, 34.0, 43.0, 41.0, 1068.0, 39.0, 41.0, 37.0, 39.0, 33.0, 30.0, 34.0, 27.0, 24.0, 20.0, 28.0, 25.0, 19.0, 16.0, 14.0, 17.0, 6.0, 12.0, 6.0, 6.0, 6.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-6.09375, -5.91119384765625, -5.7286376953125, -5.54608154296875, -5.363525390625, -5.18096923828125, -4.9984130859375, -4.81585693359375, -4.63330078125, -4.45074462890625, -4.2681884765625, -4.08563232421875, -3.903076171875, -3.72052001953125, -3.5379638671875, -3.35540771484375, -3.1728515625, -2.99029541015625, -2.8077392578125, -2.62518310546875, -2.442626953125, -2.26007080078125, -2.0775146484375, -1.89495849609375, -1.71240234375, -1.52984619140625, -1.3472900390625, -1.16473388671875, -0.982177734375, -0.79962158203125, -0.6170654296875, -0.43450927734375, -0.251953125, -0.06939697265625, 0.1131591796875, 0.29571533203125, 0.478271484375, 0.66082763671875, 0.8433837890625, 1.02593994140625, 1.20849609375, 1.39105224609375, 1.5736083984375, 1.75616455078125, 1.938720703125, 2.12127685546875, 2.3038330078125, 2.48638916015625, 2.6689453125, 2.85150146484375, 3.0340576171875, 3.21661376953125, 3.399169921875, 3.58172607421875, 3.7642822265625, 3.94683837890625, 4.12939453125, 4.31195068359375, 4.4945068359375, 4.67706298828125, 4.859619140625, 5.04217529296875, 5.2247314453125, 5.40728759765625, 5.58984375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 8.0, 14.0, 15.0, 12.0, 25.0, 46.0, 53.0, 84.0, 102.0, 165.0, 257.0, 419.0, 593.0, 935.0, 1513.0, 2252.0, 3637.0, 5992.0, 10204.0, 17144.0, 29630.0, 54605.0, 105004.0, 221500.0, 1332771.0, 145099.0, 71976.0, 38709.0, 21632.0, 12551.0, 7636.0, 4687.0, 2786.0, 1786.0, 1180.0, 715.0, 470.0, 311.0, 199.0, 132.0, 78.0, 65.0, 41.0, 32.0, 21.0, 14.0, 7.0, 7.0, 9.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.91796875, -0.8885650634765625, -0.859161376953125, -0.8297576904296875, -0.80035400390625, -0.7709503173828125, -0.741546630859375, -0.7121429443359375, -0.6827392578125, -0.6533355712890625, -0.623931884765625, -0.5945281982421875, -0.56512451171875, -0.5357208251953125, -0.506317138671875, -0.4769134521484375, -0.447509765625, -0.4181060791015625, -0.388702392578125, -0.3592987060546875, -0.32989501953125, -0.3004913330078125, -0.271087646484375, -0.2416839599609375, -0.2122802734375, -0.1828765869140625, -0.153472900390625, -0.1240692138671875, -0.09466552734375, -0.0652618408203125, -0.035858154296875, -0.0064544677734375, 0.02294921875, 0.0523529052734375, 0.081756591796875, 0.1111602783203125, 0.14056396484375, 0.1699676513671875, 0.199371337890625, 0.2287750244140625, 0.2581787109375, 0.2875823974609375, 0.316986083984375, 0.3463897705078125, 0.37579345703125, 0.4051971435546875, 0.434600830078125, 0.4640045166015625, 0.493408203125, 0.5228118896484375, 0.552215576171875, 0.5816192626953125, 0.61102294921875, 0.6404266357421875, 0.669830322265625, 0.6992340087890625, 0.7286376953125, 0.7580413818359375, 0.787445068359375, 0.8168487548828125, 0.84625244140625, 0.8756561279296875, 0.905059814453125, 0.9344635009765625, 0.9638671875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 5.0, 6.0, 7.0, 7.0, 12.0, 11.0, 13.0, 13.0, 22.0, 24.0, 22.0, 23.0, 27.0, 32.0, 43.0, 60.0, 47.0, 45.0, 50.0, 42.0, 46.0, 47.0, 44.0, 58.0, 43.0, 35.0, 35.0, 39.0, 26.0, 19.0, 18.0, 23.0, 13.0, 6.0, 6.0, 6.0, 6.0, 3.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0019445419311523438, -0.0018886178731918335, -0.0018326938152313232, -0.001776769757270813, -0.0017208456993103027, -0.0016649216413497925, -0.0016089975833892822, -0.001553073525428772, -0.0014971494674682617, -0.0014412254095077515, -0.0013853013515472412, -0.001329377293586731, -0.0012734532356262207, -0.0012175291776657104, -0.0011616051197052002, -0.00110568106174469, -0.0010497570037841797, -0.0009938329458236694, -0.0009379088878631592, -0.0008819848299026489, -0.0008260607719421387, -0.0007701367139816284, -0.0007142126560211182, -0.0006582885980606079, -0.0006023645401000977, -0.0005464404821395874, -0.0004905164241790771, -0.0004345923662185669, -0.00037866830825805664, -0.0003227442502975464, -0.00026682019233703613, -0.00021089613437652588, -0.00015497207641601562, -9.904801845550537e-05, -4.312396049499512e-05, 1.2800097465515137e-05, 6.872415542602539e-05, 0.00012464821338653564, 0.0001805722713470459, 0.00023649632930755615, 0.0002924203872680664, 0.00034834444522857666, 0.0004042685031890869, 0.00046019256114959717, 0.0005161166191101074, 0.0005720406770706177, 0.0006279647350311279, 0.0006838887929916382, 0.0007398128509521484, 0.0007957369089126587, 0.0008516609668731689, 0.0009075850248336792, 0.0009635090827941895, 0.0010194331407546997, 0.00107535719871521, 0.0011312812566757202, 0.0011872053146362305, 0.0012431293725967407, 0.001299053430557251, 0.0013549774885177612, 0.0014109015464782715, 0.0014668256044387817, 0.001522749662399292, 0.0015786737203598022, 0.0016345977783203125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 4.0, 7.0, 11.0, 17.0, 16.0, 23.0, 31.0, 33.0, 52.0, 69.0, 68.0, 93.0, 120.0, 148.0, 176.0, 241.0, 468.0, 3518.0, 790093.0, 250050.0, 1835.0, 401.0, 248.0, 183.0, 136.0, 101.0, 81.0, 75.0, 41.0, 43.0, 41.0, 21.0, 25.0, 22.0, 16.0, 10.0, 9.0, 8.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.039947509765625, -0.038834571838378906, -0.03772163391113281, -0.03660869598388672, -0.035495758056640625, -0.03438282012939453, -0.03326988220214844, -0.032156944274902344, -0.03104400634765625, -0.029931068420410156, -0.028818130493164062, -0.02770519256591797, -0.026592254638671875, -0.02547931671142578, -0.024366378784179688, -0.023253440856933594, -0.0221405029296875, -0.021027565002441406, -0.019914627075195312, -0.01880168914794922, -0.017688751220703125, -0.01657581329345703, -0.015462875366210938, -0.014349937438964844, -0.01323699951171875, -0.012124061584472656, -0.011011123657226562, -0.009898185729980469, -0.008785247802734375, -0.007672309875488281, -0.0065593719482421875, -0.005446434020996094, -0.00433349609375, -0.0032205581665039062, -0.0021076202392578125, -0.0009946823120117188, 0.000118255615234375, 0.0012311935424804688, 0.0023441314697265625, 0.0034570693969726562, 0.00457000732421875, 0.005682945251464844, 0.0067958831787109375, 0.007908821105957031, 0.009021759033203125, 0.010134696960449219, 0.011247634887695312, 0.012360572814941406, 0.0134735107421875, 0.014586448669433594, 0.015699386596679688, 0.01681232452392578, 0.017925262451171875, 0.01903820037841797, 0.020151138305664062, 0.021264076232910156, 0.02237701416015625, 0.023489952087402344, 0.024602890014648438, 0.02571582794189453, 0.026828765869140625, 0.02794170379638672, 0.029054641723632812, 0.030167579650878906, 0.031280517578125]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 12.0, 36.0, 350.0, 504.0, 99.0, 13.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025644097477197647, -0.002353518968448043, -0.002142628189176321, -0.001931737526319921, -0.001720846863463521, -0.0015099560841917992, -0.0012990653049200773, -0.0010881746420636773, -0.0008772838627919555, -0.0006663931417278945, -0.00045550239156000316, -0.0002446116413921118, -3.372092032805085e-05, 0.00017716980073601007, 0.0003880605800077319, 0.0005989512428641319, 0.0008098420221358538, 0.0010207328014075756, 0.0012316234642639756, 0.0014425142435356975, 0.0016534049063920975, 0.0018642956856638193, 0.002075186464935541, 0.0022860770113766193, 0.002496968023478985, 0.0027078588027507067, 0.0029187495820224285, 0.0031296401284635067, 0.0033405309077352285, 0.0035514216870069504, 0.0037623124662786722, 0.003973203245550394, 0.004184093791991472, 0.00439498433843255, 0.004605875350534916, 0.004816765896975994, 0.00502765690907836, 0.005238547455519438, 0.005449438467621803, 0.0056603290140628815, 0.00587121956050396, 0.006082110106945038, 0.006293001119047403, 0.0065038916654884815, 0.006714782677590847, 0.006925673224031925, 0.007136563770473003, 0.007347454782575369, 0.007558345794677734, 0.0077692363411188126, 0.00798012688755989, 0.008191018365323544, 0.008401908911764622, 0.0086127994582057, 0.008823690004646778, 0.009034580551087856, 0.009245471097528934, 0.009456361643970013, 0.00966725219041109, 0.009878143668174744, 0.010089034214615822, 0.0102999247610569, 0.010510815307497978, 0.010721705853939056, 0.01093259733170271]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 3.0, 3.0, 5.0, 3.0, 11.0, 7.0, 9.0, 15.0, 25.0, 25.0, 14.0, 29.0, 29.0, 30.0, 30.0, 37.0, 35.0, 40.0, 47.0, 47.0, 50.0, 36.0, 35.0, 48.0, 31.0, 36.0, 46.0, 33.0, 37.0, 33.0, 26.0, 22.0, 23.0, 24.0, 15.0, 15.0, 14.0, 10.0, 9.0, 1.0, 3.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011314153671264648, -0.0010961266234517097, -0.0010608378797769547, -0.0010255491361021996, -0.0009902603924274445, -0.0009549716487526894, -0.0009196829050779343, -0.0008843941614031792, -0.0008491054177284241, -0.000813816674053669, -0.0007785279303789139, -0.0007432391867041588, -0.0007079504430294037, -0.0006726616993546486, -0.0006373729556798935, -0.0006020842120051384, -0.0005667954683303833, -0.0005315067246556282, -0.0004962179809808731, -0.000460929237306118, -0.0004256404936313629, -0.0003903517499566078, -0.0003550630062818527, -0.0003197742626070976, -0.00028448551893234253, -0.00024919677525758743, -0.00021390803158283234, -0.00017861928790807724, -0.00014333054423332214, -0.00010804180055856705, -7.275305688381195e-05, -3.7464313209056854e-05, -2.175569534301758e-06, 3.311317414045334e-05, 6.840191781520844e-05, 0.00010369066148996353, 0.00013897940516471863, 0.00017426814883947372, 0.00020955689251422882, 0.0002448456361889839, 0.000280134379863739, 0.0003154231235384941, 0.0003507118672132492, 0.0003860006108880043, 0.0004212893545627594, 0.0004565780982375145, 0.0004918668419122696, 0.0005271555855870247, 0.0005624443292617798, 0.0005977330729365349, 0.00063302181661129, 0.0006683105602860451, 0.0007035993039608002, 0.0007388880476355553, 0.0007741767913103104, 0.0008094655349850655, 0.0008447542786598206, 0.0008800430223345757, 0.0009153317660093307, 0.0009506205096840858, 0.000985909253358841, 0.001021197997033596, 0.0010564867407083511, 0.0010917754843831062, 0.0011270642280578613]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 6.0, 6.0, 10.0, 7.0, 21.0, 31.0, 30.0, 35.0, 41.0, 46.0, 51.0, 51.0, 66.0, 72.0, 64.0, 72.0, 60.0, 53.0, 68.0, 54.0, 32.0, 27.0, 21.0, 18.0, 18.0, 16.0, 8.0, 6.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.078125, -13.642822265625, -13.20751953125, -12.772216796875, -12.3369140625, -11.901611328125, -11.46630859375, -11.031005859375, -10.595703125, -10.160400390625, -9.72509765625, -9.289794921875, -8.8544921875, -8.419189453125, -7.98388671875, -7.548583984375, -7.11328125, -6.677978515625, -6.24267578125, -5.807373046875, -5.3720703125, -4.936767578125, -4.50146484375, -4.066162109375, -3.630859375, -3.195556640625, -2.76025390625, -2.324951171875, -1.8896484375, -1.454345703125, -1.01904296875, -0.583740234375, -0.1484375, 0.286865234375, 0.72216796875, 1.157470703125, 1.5927734375, 2.028076171875, 2.46337890625, 2.898681640625, 3.333984375, 3.769287109375, 4.20458984375, 4.639892578125, 5.0751953125, 5.510498046875, 5.94580078125, 6.381103515625, 6.81640625, 7.251708984375, 7.68701171875, 8.122314453125, 8.5576171875, 8.992919921875, 9.42822265625, 9.863525390625, 10.298828125, 10.734130859375, 11.16943359375, 11.604736328125, 12.0400390625, 12.475341796875, 12.91064453125, 13.345947265625, 13.78125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 6.0, 3.0, 1.0, 9.0, 15.0, 21.0, 20.0, 28.0, 54.0, 83.0, 158.0, 252.0, 433.0, 894.0, 1786.0, 3883.0, 9828.0, 31833.0, 158189.0, 644161.0, 149120.0, 30693.0, 9569.0, 3859.0, 1735.0, 815.0, 433.0, 265.0, 145.0, 99.0, 60.0, 37.0, 20.0, 22.0, 10.0, 8.0, 2.0, 6.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8984375, -8.62451171875, -8.3505859375, -8.07666015625, -7.802734375, -7.52880859375, -7.2548828125, -6.98095703125, -6.70703125, -6.43310546875, -6.1591796875, -5.88525390625, -5.611328125, -5.33740234375, -5.0634765625, -4.78955078125, -4.515625, -4.24169921875, -3.9677734375, -3.69384765625, -3.419921875, -3.14599609375, -2.8720703125, -2.59814453125, -2.32421875, -2.05029296875, -1.7763671875, -1.50244140625, -1.228515625, -0.95458984375, -0.6806640625, -0.40673828125, -0.1328125, 0.14111328125, 0.4150390625, 0.68896484375, 0.962890625, 1.23681640625, 1.5107421875, 1.78466796875, 2.05859375, 2.33251953125, 2.6064453125, 2.88037109375, 3.154296875, 3.42822265625, 3.7021484375, 3.97607421875, 4.25, 4.52392578125, 4.7978515625, 5.07177734375, 5.345703125, 5.61962890625, 5.8935546875, 6.16748046875, 6.44140625, 6.71533203125, 6.9892578125, 7.26318359375, 7.537109375, 7.81103515625, 8.0849609375, 8.35888671875, 8.6328125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 2.0, 11.0, 13.0, 11.0, 15.0, 17.0, 10.0, 9.0, 17.0, 22.0, 30.0, 31.0, 24.0, 27.0, 31.0, 36.0, 56.0, 60.0, 91.0, 1808.0, 211.0, 71.0, 45.0, 49.0, 51.0, 31.0, 38.0, 25.0, 27.0, 12.0, 28.0, 25.0, 17.0, 14.0, 14.0, 12.0, 11.0, 4.0, 6.0, 6.0, 12.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-37.3125, -36.29833984375, -35.2841796875, -34.27001953125, -33.255859375, -32.24169921875, -31.2275390625, -30.21337890625, -29.19921875, -28.18505859375, -27.1708984375, -26.15673828125, -25.142578125, -24.12841796875, -23.1142578125, -22.10009765625, -21.0859375, -20.07177734375, -19.0576171875, -18.04345703125, -17.029296875, -16.01513671875, -15.0009765625, -13.98681640625, -12.97265625, -11.95849609375, -10.9443359375, -9.93017578125, -8.916015625, -7.90185546875, -6.8876953125, -5.87353515625, -4.859375, -3.84521484375, -2.8310546875, -1.81689453125, -0.802734375, 0.21142578125, 1.2255859375, 2.23974609375, 3.25390625, 4.26806640625, 5.2822265625, 6.29638671875, 7.310546875, 8.32470703125, 9.3388671875, 10.35302734375, 11.3671875, 12.38134765625, 13.3955078125, 14.40966796875, 15.423828125, 16.43798828125, 17.4521484375, 18.46630859375, 19.48046875, 20.49462890625, 21.5087890625, 22.52294921875, 23.537109375, 24.55126953125, 25.5654296875, 26.57958984375, 27.59375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 8.0, 7.0, 5.0, 3.0, 9.0, 5.0, 13.0, 14.0, 17.0, 18.0, 19.0, 29.0, 26.0, 28.0, 28.0, 67.0, 74.0, 124.0, 249.0, 526.0, 1597.0, 19069.0, 3089057.0, 31418.0, 1951.0, 570.0, 261.0, 132.0, 82.0, 50.0, 56.0, 24.0, 33.0, 22.0, 15.0, 14.0, 11.0, 17.0, 15.0, 11.0, 11.0, 5.0, 5.0, 6.0, 1.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-45.28125, -43.576171875, -41.87109375, -40.166015625, -38.4609375, -36.755859375, -35.05078125, -33.345703125, -31.640625, -29.935546875, -28.23046875, -26.525390625, -24.8203125, -23.115234375, -21.41015625, -19.705078125, -18.0, -16.294921875, -14.58984375, -12.884765625, -11.1796875, -9.474609375, -7.76953125, -6.064453125, -4.359375, -2.654296875, -0.94921875, 0.755859375, 2.4609375, 4.166015625, 5.87109375, 7.576171875, 9.28125, 10.986328125, 12.69140625, 14.396484375, 16.1015625, 17.806640625, 19.51171875, 21.216796875, 22.921875, 24.626953125, 26.33203125, 28.037109375, 29.7421875, 31.447265625, 33.15234375, 34.857421875, 36.5625, 38.267578125, 39.97265625, 41.677734375, 43.3828125, 45.087890625, 46.79296875, 48.498046875, 50.203125, 51.908203125, 53.61328125, 55.318359375, 57.0234375, 58.728515625, 60.43359375, 62.138671875, 63.84375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 20.0, 666.0, 322.0, 11.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-302.28594970703125, -296.0950622558594, -289.9042053222656, -283.71331787109375, -277.5224304199219, -271.3315734863281, -265.14068603515625, -258.9498291015625, -252.75894165039062, -246.5680694580078, -240.37718200683594, -234.18630981445312, -227.9954376220703, -221.8045654296875, -215.61367797851562, -209.4228057861328, -203.23193359375, -197.0410614013672, -190.8501739501953, -184.6593017578125, -178.4684295654297, -172.27755737304688, -166.086669921875, -159.8957977294922, -153.7049102783203, -147.5140380859375, -141.32315063476562, -135.1322784423828, -128.94140625, -122.75052642822266, -116.55964660644531, -110.3687744140625, -104.17790985107422, -97.98703002929688, -91.79615783691406, -85.60527801513672, -79.4144058227539, -73.22352600097656, -67.03265380859375, -60.841773986816406, -54.65089797973633, -48.46002197265625, -42.26914596557617, -36.078269958496094, -29.887392044067383, -23.696516036987305, -17.505638122558594, -11.314762115478516, -5.1238861083984375, 1.0669903755187988, 7.257866859436035, 13.44874382019043, 19.639619827270508, 25.830495834350586, 32.0213737487793, 38.212249755859375, 44.40312576293945, 50.59400177001953, 56.78487777709961, 62.97575378417969, 69.16663360595703, 75.35750579833984, 81.54838562011719, 87.7392578125, 93.93013763427734]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 3.0, 7.0, 5.0, 16.0, 8.0, 13.0, 24.0, 15.0, 21.0, 23.0, 30.0, 32.0, 44.0, 36.0, 42.0, 45.0, 35.0, 38.0, 46.0, 47.0, 46.0, 35.0, 37.0, 37.0, 44.0, 42.0, 45.0, 26.0, 26.0, 25.0, 24.0, 15.0, 10.0, 12.0, 11.0, 5.0, 5.0, 4.0, 9.0, 2.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-136.15957641601562, -132.196044921875, -128.2324981689453, -124.26895904541016, -120.305419921875, -116.34188079833984, -112.37834167480469, -108.41481018066406, -104.45126342773438, -100.48772430419922, -96.52418518066406, -92.5606460571289, -88.59710693359375, -84.6335678100586, -80.67002868652344, -76.70649719238281, -72.74295806884766, -68.7794189453125, -64.81587982177734, -60.85234069824219, -56.88880157470703, -52.925262451171875, -48.961727142333984, -44.99818801879883, -41.03464889526367, -37.071109771728516, -33.10757064819336, -29.144033432006836, -25.18049430847168, -21.216955184936523, -17.25341796875, -13.289878845214844, -9.326332092285156, -5.362793445587158, -1.3992547988891602, 2.5642833709716797, 6.527822494506836, 10.491361618041992, 14.454898834228516, 18.418437957763672, 22.381977081298828, 26.345516204833984, 30.30905532836914, 34.27259063720703, 38.23612976074219, 42.199668884277344, 46.1632080078125, 50.126747131347656, 54.09028625488281, 58.05382537841797, 62.017364501953125, 65.98090362548828, 69.94444274902344, 73.9079818725586, 77.87152099609375, 81.83505249023438, 85.79859924316406, 89.76213836669922, 93.72567749023438, 97.68921661376953, 101.65275573730469, 105.61629486083984, 109.579833984375, 113.54336547851562, 117.50690460205078]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 5.0, 4.0, 9.0, 7.0, 11.0, 24.0, 29.0, 23.0, 37.0, 39.0, 49.0, 42.0, 47.0, 69.0, 61.0, 59.0, 74.0, 58.0, 62.0, 55.0, 53.0, 45.0, 29.0, 28.0, 13.0, 19.0, 20.0, 7.0, 12.0, 6.0, 3.0, 2.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1953125, -13.760009765625, -13.32470703125, -12.889404296875, -12.4541015625, -12.018798828125, -11.58349609375, -11.148193359375, -10.712890625, -10.277587890625, -9.84228515625, -9.406982421875, -8.9716796875, -8.536376953125, -8.10107421875, -7.665771484375, -7.23046875, -6.795166015625, -6.35986328125, -5.924560546875, -5.4892578125, -5.053955078125, -4.61865234375, -4.183349609375, -3.748046875, -3.312744140625, -2.87744140625, -2.442138671875, -2.0068359375, -1.571533203125, -1.13623046875, -0.700927734375, -0.265625, 0.169677734375, 0.60498046875, 1.040283203125, 1.4755859375, 1.910888671875, 2.34619140625, 2.781494140625, 3.216796875, 3.652099609375, 4.08740234375, 4.522705078125, 4.9580078125, 5.393310546875, 5.82861328125, 6.263916015625, 6.69921875, 7.134521484375, 7.56982421875, 8.005126953125, 8.4404296875, 8.875732421875, 9.31103515625, 9.746337890625, 10.181640625, 10.616943359375, 11.05224609375, 11.487548828125, 11.9228515625, 12.358154296875, 12.79345703125, 13.228759765625, 13.6640625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 8.0, 13.0, 12.0, 12.0, 23.0, 30.0, 34.0, 52.0, 57.0, 113.0, 250.0, 1043.0, 10120.0, 4142125.0, 38066.0, 1627.0, 330.0, 99.0, 73.0, 61.0, 25.0, 19.0, 22.0, 19.0, 15.0, 10.0, 5.0, 4.0, 5.0, 3.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-108.9375, -105.6982421875, -102.458984375, -99.2197265625, -95.98046875, -92.7412109375, -89.501953125, -86.2626953125, -83.0234375, -79.7841796875, -76.544921875, -73.3056640625, -70.06640625, -66.8271484375, -63.587890625, -60.3486328125, -57.109375, -53.8701171875, -50.630859375, -47.3916015625, -44.15234375, -40.9130859375, -37.673828125, -34.4345703125, -31.1953125, -27.9560546875, -24.716796875, -21.4775390625, -18.23828125, -14.9990234375, -11.759765625, -8.5205078125, -5.28125, -2.0419921875, 1.197265625, 4.4365234375, 7.67578125, 10.9150390625, 14.154296875, 17.3935546875, 20.6328125, 23.8720703125, 27.111328125, 30.3505859375, 33.58984375, 36.8291015625, 40.068359375, 43.3076171875, 46.546875, 49.7861328125, 53.025390625, 56.2646484375, 59.50390625, 62.7431640625, 65.982421875, 69.2216796875, 72.4609375, 75.7001953125, 78.939453125, 82.1787109375, 85.41796875, 88.6572265625, 91.896484375, 95.1357421875, 98.375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 5.0, 6.0, 10.0, 14.0, 6.0, 12.0, 24.0, 21.0, 37.0, 61.0, 104.0, 226.0, 503.0, 848.0, 1003.0, 596.0, 281.0, 135.0, 74.0, 35.0, 18.0, 13.0, 6.0, 10.0, 7.0, 6.0, 10.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.78125, -31.65380859375, -30.5263671875, -29.39892578125, -28.271484375, -27.14404296875, -26.0166015625, -24.88916015625, -23.76171875, -22.63427734375, -21.5068359375, -20.37939453125, -19.251953125, -18.12451171875, -16.9970703125, -15.86962890625, -14.7421875, -13.61474609375, -12.4873046875, -11.35986328125, -10.232421875, -9.10498046875, -7.9775390625, -6.85009765625, -5.72265625, -4.59521484375, -3.4677734375, -2.34033203125, -1.212890625, -0.08544921875, 1.0419921875, 2.16943359375, 3.296875, 4.42431640625, 5.5517578125, 6.67919921875, 7.806640625, 8.93408203125, 10.0615234375, 11.18896484375, 12.31640625, 13.44384765625, 14.5712890625, 15.69873046875, 16.826171875, 17.95361328125, 19.0810546875, 20.20849609375, 21.3359375, 22.46337890625, 23.5908203125, 24.71826171875, 25.845703125, 26.97314453125, 28.1005859375, 29.22802734375, 30.35546875, 31.48291015625, 32.6103515625, 33.73779296875, 34.865234375, 35.99267578125, 37.1201171875, 38.24755859375, 39.375]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 9.0, 8.0, 8.0, 8.0, 16.0, 26.0, 47.0, 80.0, 182.0, 459.0, 990.0, 3499.0, 13223.0, 86923.0, 3894050.0, 171037.0, 17216.0, 4300.0, 1259.0, 495.0, 208.0, 94.0, 66.0, 21.0, 20.0, 14.0, 13.0, 5.0, 8.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-83.5625, -81.21484375, -78.8671875, -76.51953125, -74.171875, -71.82421875, -69.4765625, -67.12890625, -64.78125, -62.43359375, -60.0859375, -57.73828125, -55.390625, -53.04296875, -50.6953125, -48.34765625, -46.0, -43.65234375, -41.3046875, -38.95703125, -36.609375, -34.26171875, -31.9140625, -29.56640625, -27.21875, -24.87109375, -22.5234375, -20.17578125, -17.828125, -15.48046875, -13.1328125, -10.78515625, -8.4375, -6.08984375, -3.7421875, -1.39453125, 0.953125, 3.30078125, 5.6484375, 7.99609375, 10.34375, 12.69140625, 15.0390625, 17.38671875, 19.734375, 22.08203125, 24.4296875, 26.77734375, 29.125, 31.47265625, 33.8203125, 36.16796875, 38.515625, 40.86328125, 43.2109375, 45.55859375, 47.90625, 50.25390625, 52.6015625, 54.94921875, 57.296875, 59.64453125, 61.9921875, 64.33984375, 66.6875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 5.0, 1.0, 12.0, 13.0, 38.0, 55.0, 105.0, 190.0, 231.0, 157.0, 91.0, 41.0, 29.0, 17.0, 7.0, 6.0, 3.0, 2.0, 4.0, 3.0], "bins": [-254.2326202392578, -249.38121032714844, -244.52980041503906, -239.6783905029297, -234.8269805908203, -229.97557067871094, -225.12416076660156, -220.27273559570312, -215.42132568359375, -210.56991577148438, -205.718505859375, -200.86709594726562, -196.01568603515625, -191.16427612304688, -186.3128662109375, -181.46145629882812, -176.61004638671875, -171.75863647460938, -166.9072265625, -162.05581665039062, -157.20440673828125, -152.35299682617188, -147.5015869140625, -142.65017700195312, -137.79876708984375, -132.94735717773438, -128.095947265625, -123.24453735351562, -118.39312744140625, -113.54171752929688, -108.69029998779297, -103.8388900756836, -98.98746490478516, -94.13605499267578, -89.2846450805664, -84.43323516845703, -79.58181762695312, -74.73040771484375, -69.87899780273438, -65.027587890625, -60.176177978515625, -55.32476806640625, -50.473358154296875, -45.621944427490234, -40.77053451538086, -35.919124603271484, -31.067712783813477, -26.21630096435547, -21.364891052246094, -16.51348114013672, -11.662069320678711, -6.8106584548950195, -1.9592475891113281, 2.892162322998047, 7.743574142456055, 12.594985961914062, 17.446395874023438, 22.297805786132812, 27.14921760559082, 32.00062942504883, 36.8520393371582, 41.70344924926758, 46.55486297607422, 51.406272888183594, 56.25768280029297]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 11.0, 15.0, 10.0, 20.0, 21.0, 21.0, 23.0, 28.0, 36.0, 34.0, 34.0, 33.0, 46.0, 40.0, 36.0, 33.0, 52.0, 41.0, 34.0, 44.0, 44.0, 39.0, 36.0, 39.0, 22.0, 24.0, 29.0, 18.0, 29.0, 16.0, 20.0, 14.0, 8.0, 8.0, 8.0, 4.0, 6.0, 6.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-66.7210693359375, -64.40259552001953, -62.08412551879883, -59.76565170288086, -57.447181701660156, -55.12870788574219, -52.81023406982422, -50.491764068603516, -48.17329406738281, -45.854820251464844, -43.53635025024414, -41.21787643432617, -38.89940643310547, -36.5809326171875, -34.26245880126953, -31.943988800048828, -29.62551498413086, -27.307043075561523, -24.988571166992188, -22.67009735107422, -20.351627349853516, -18.033153533935547, -15.714681625366211, -13.396209716796875, -11.077737808227539, -8.759265899658203, -6.440793514251709, -4.122321128845215, -1.803849220275879, 0.514622688293457, 2.8330955505371094, 5.151567459106445, 7.470039367675781, 9.788511276245117, 12.106983184814453, 14.425456047058105, 16.743927001953125, 19.062400817871094, 21.38087272644043, 23.699344635009766, 26.0178165435791, 28.336288452148438, 30.654760360717773, 32.97323226928711, 35.29170608520508, 37.61017608642578, 39.92864990234375, 42.24712371826172, 44.56559371948242, 46.88406753540039, 49.202537536621094, 51.52101135253906, 53.839481353759766, 56.157955169677734, 58.47642517089844, 60.794898986816406, 63.113372802734375, 65.43184661865234, 67.75032043457031, 70.06878662109375, 72.38726043701172, 74.70573425292969, 77.02420806884766, 79.34268188476562, 81.66114807128906]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 9.0, 15.0, 18.0, 23.0, 29.0, 32.0, 26.0, 33.0, 42.0, 55.0, 42.0, 58.0, 52.0, 58.0, 53.0, 64.0, 56.0, 41.0, 50.0, 36.0, 34.0, 35.0, 23.0, 20.0, 20.0, 19.0, 15.0, 6.0, 8.0, 7.0, 5.0, 3.0, 5.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6953125, -12.2977294921875, -11.900146484375, -11.5025634765625, -11.10498046875, -10.7073974609375, -10.309814453125, -9.9122314453125, -9.5146484375, -9.1170654296875, -8.719482421875, -8.3218994140625, -7.92431640625, -7.5267333984375, -7.129150390625, -6.7315673828125, -6.333984375, -5.9364013671875, -5.538818359375, -5.1412353515625, -4.74365234375, -4.3460693359375, -3.948486328125, -3.5509033203125, -3.1533203125, -2.7557373046875, -2.358154296875, -1.9605712890625, -1.56298828125, -1.1654052734375, -0.767822265625, -0.3702392578125, 0.02734375, 0.4249267578125, 0.822509765625, 1.2200927734375, 1.61767578125, 2.0152587890625, 2.412841796875, 2.8104248046875, 3.2080078125, 3.6055908203125, 4.003173828125, 4.4007568359375, 4.79833984375, 5.1959228515625, 5.593505859375, 5.9910888671875, 6.388671875, 6.7862548828125, 7.183837890625, 7.5814208984375, 7.97900390625, 8.3765869140625, 8.774169921875, 9.1717529296875, 9.5693359375, 9.9669189453125, 10.364501953125, 10.7620849609375, 11.15966796875, 11.5572509765625, 11.954833984375, 12.3524169921875, 12.75]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 7.0, 16.0, 23.0, 30.0, 46.0, 49.0, 98.0, 143.0, 272.0, 443.0, 662.0, 1150.0, 1900.0, 3380.0, 5885.0, 11373.0, 22100.0, 45546.0, 103238.0, 266370.0, 335740.0, 134998.0, 57120.0, 27422.0, 13705.0, 7180.0, 3937.0, 2296.0, 1352.0, 824.0, 474.0, 288.0, 168.0, 113.0, 71.0, 50.0, 28.0, 18.0, 9.0, 14.0, 2.0, 7.0, 0.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.4609375, -1.41937255859375, -1.3778076171875, -1.33624267578125, -1.294677734375, -1.25311279296875, -1.2115478515625, -1.16998291015625, -1.12841796875, -1.08685302734375, -1.0452880859375, -1.00372314453125, -0.962158203125, -0.92059326171875, -0.8790283203125, -0.83746337890625, -0.7958984375, -0.75433349609375, -0.7127685546875, -0.67120361328125, -0.629638671875, -0.58807373046875, -0.5465087890625, -0.50494384765625, -0.46337890625, -0.42181396484375, -0.3802490234375, -0.33868408203125, -0.297119140625, -0.25555419921875, -0.2139892578125, -0.17242431640625, -0.130859375, -0.08929443359375, -0.0477294921875, -0.00616455078125, 0.035400390625, 0.07696533203125, 0.1185302734375, 0.16009521484375, 0.20166015625, 0.24322509765625, 0.2847900390625, 0.32635498046875, 0.367919921875, 0.40948486328125, 0.4510498046875, 0.49261474609375, 0.5341796875, 0.57574462890625, 0.6173095703125, 0.65887451171875, 0.700439453125, 0.74200439453125, 0.7835693359375, 0.82513427734375, 0.86669921875, 0.90826416015625, 0.9498291015625, 0.99139404296875, 1.032958984375, 1.07452392578125, 1.1160888671875, 1.15765380859375, 1.19921875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 4.0, 5.0, 3.0, 4.0, 3.0, 1.0, 5.0, 6.0, 7.0, 10.0, 15.0, 13.0, 14.0, 15.0, 17.0, 13.0, 23.0, 18.0, 16.0, 25.0, 30.0, 32.0, 24.0, 34.0, 30.0, 25.0, 32.0, 42.0, 1066.0, 37.0, 39.0, 45.0, 33.0, 31.0, 24.0, 30.0, 25.0, 31.0, 24.0, 18.0, 30.0, 18.0, 18.0, 14.0, 21.0, 15.0, 13.0, 4.0, 6.0, 9.0, 5.0, 4.0, 3.0, 5.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.11328125, -4.9422607421875, -4.771240234375, -4.6002197265625, -4.42919921875, -4.2581787109375, -4.087158203125, -3.9161376953125, -3.7451171875, -3.5740966796875, -3.403076171875, -3.2320556640625, -3.06103515625, -2.8900146484375, -2.718994140625, -2.5479736328125, -2.376953125, -2.2059326171875, -2.034912109375, -1.8638916015625, -1.69287109375, -1.5218505859375, -1.350830078125, -1.1798095703125, -1.0087890625, -0.8377685546875, -0.666748046875, -0.4957275390625, -0.32470703125, -0.1536865234375, 0.017333984375, 0.1883544921875, 0.359375, 0.5303955078125, 0.701416015625, 0.8724365234375, 1.04345703125, 1.2144775390625, 1.385498046875, 1.5565185546875, 1.7275390625, 1.8985595703125, 2.069580078125, 2.2406005859375, 2.41162109375, 2.5826416015625, 2.753662109375, 2.9246826171875, 3.095703125, 3.2667236328125, 3.437744140625, 3.6087646484375, 3.77978515625, 3.9508056640625, 4.121826171875, 4.2928466796875, 4.4638671875, 4.6348876953125, 4.805908203125, 4.9769287109375, 5.14794921875, 5.3189697265625, 5.489990234375, 5.6610107421875, 5.83203125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 16.0, 12.0, 17.0, 37.0, 44.0, 63.0, 85.0, 124.0, 181.0, 264.0, 418.0, 667.0, 1067.0, 1736.0, 2602.0, 4164.0, 6288.0, 10272.0, 16665.0, 27182.0, 46228.0, 82320.0, 163202.0, 1329052.0, 184662.0, 91264.0, 50601.0, 29997.0, 17554.0, 11027.0, 6946.0, 4506.0, 2841.0, 1817.0, 1141.0, 657.0, 480.0, 300.0, 205.0, 144.0, 72.0, 66.0, 42.0, 30.0, 23.0, 21.0, 10.0, 7.0, 6.0, 3.0, 6.0, 0.0, 3.0], "bins": [-0.9873046875, -0.9587554931640625, -0.930206298828125, -0.9016571044921875, -0.87310791015625, -0.8445587158203125, -0.816009521484375, -0.7874603271484375, -0.7589111328125, -0.7303619384765625, -0.701812744140625, -0.6732635498046875, -0.64471435546875, -0.6161651611328125, -0.587615966796875, -0.5590667724609375, -0.530517578125, -0.5019683837890625, -0.473419189453125, -0.4448699951171875, -0.41632080078125, -0.3877716064453125, -0.359222412109375, -0.3306732177734375, -0.3021240234375, -0.2735748291015625, -0.245025634765625, -0.2164764404296875, -0.18792724609375, -0.1593780517578125, -0.130828857421875, -0.1022796630859375, -0.07373046875, -0.0451812744140625, -0.016632080078125, 0.0119171142578125, 0.04046630859375, 0.0690155029296875, 0.097564697265625, 0.1261138916015625, 0.1546630859375, 0.1832122802734375, 0.211761474609375, 0.2403106689453125, 0.26885986328125, 0.2974090576171875, 0.325958251953125, 0.3545074462890625, 0.383056640625, 0.4116058349609375, 0.440155029296875, 0.4687042236328125, 0.49725341796875, 0.5258026123046875, 0.554351806640625, 0.5829010009765625, 0.6114501953125, 0.6399993896484375, 0.668548583984375, 0.6970977783203125, 0.72564697265625, 0.7541961669921875, 0.782745361328125, 0.8112945556640625, 0.83984375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 6.0, 2.0, 2.0, 1.0, 5.0, 5.0, 9.0, 2.0, 6.0, 4.0, 7.0, 11.0, 25.0, 23.0, 18.0, 33.0, 35.0, 43.0, 39.0, 51.0, 58.0, 50.0, 52.0, 42.0, 56.0, 52.0, 54.0, 46.0, 41.0, 48.0, 20.0, 24.0, 22.0, 23.0, 21.0, 14.0, 15.0, 3.0, 8.0, 2.0, 7.0, 2.0, 3.0, 0.0, 1.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0], "bins": [-0.002338409423828125, -0.0022737830877304077, -0.0022091567516326904, -0.002144530415534973, -0.002079904079437256, -0.0020152777433395386, -0.0019506514072418213, -0.001886025071144104, -0.0018213987350463867, -0.0017567723989486694, -0.0016921460628509521, -0.0016275197267532349, -0.0015628933906555176, -0.0014982670545578003, -0.001433640718460083, -0.0013690143823623657, -0.0013043880462646484, -0.0012397617101669312, -0.0011751353740692139, -0.0011105090379714966, -0.0010458827018737793, -0.000981256365776062, -0.0009166300296783447, -0.0008520036935806274, -0.0007873773574829102, -0.0007227510213851929, -0.0006581246852874756, -0.0005934983491897583, -0.000528872013092041, -0.00046424567699432373, -0.00039961934089660645, -0.00033499300479888916, -0.0002703666687011719, -0.0002057403326034546, -0.0001411139965057373, -7.648766040802002e-05, -1.1861324310302734e-05, 5.276501178741455e-05, 0.00011739134788513184, 0.00018201768398284912, 0.0002466440200805664, 0.0003112703561782837, 0.000375896692276001, 0.00044052302837371826, 0.0005051493644714355, 0.0005697757005691528, 0.0006344020366668701, 0.0006990283727645874, 0.0007636547088623047, 0.000828281044960022, 0.0008929073810577393, 0.0009575337171554565, 0.0010221600532531738, 0.0010867863893508911, 0.0011514127254486084, 0.0012160390615463257, 0.001280665397644043, 0.0013452917337417603, 0.0014099180698394775, 0.0014745444059371948, 0.0015391707420349121, 0.0016037970781326294, 0.0016684234142303467, 0.001733049750328064, 0.0017976760864257812]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 6.0, 5.0, 13.0, 19.0, 23.0, 29.0, 29.0, 41.0, 42.0, 51.0, 88.0, 122.0, 174.0, 244.0, 348.0, 830.0, 33753.0, 999583.0, 11275.0, 691.0, 330.0, 213.0, 157.0, 126.0, 94.0, 74.0, 39.0, 39.0, 24.0, 14.0, 14.0, 12.0, 6.0, 5.0, 8.0, 6.0, 6.0, 3.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.038299560546875, -0.03695106506347656, -0.035602569580078125, -0.03425407409667969, -0.03290557861328125, -0.03155708312988281, -0.030208587646484375, -0.028860092163085938, -0.0275115966796875, -0.026163101196289062, -0.024814605712890625, -0.023466110229492188, -0.02211761474609375, -0.020769119262695312, -0.019420623779296875, -0.018072128295898438, -0.0167236328125, -0.015375137329101562, -0.014026641845703125, -0.012678146362304688, -0.01132965087890625, -0.009981155395507812, -0.008632659912109375, -0.0072841644287109375, -0.0059356689453125, -0.0045871734619140625, -0.003238677978515625, -0.0018901824951171875, -0.00054168701171875, 0.0008068084716796875, 0.002155303955078125, 0.0035037994384765625, 0.004852294921875, 0.0062007904052734375, 0.007549285888671875, 0.008897781372070312, 0.01024627685546875, 0.011594772338867188, 0.012943267822265625, 0.014291763305664062, 0.0156402587890625, 0.016988754272460938, 0.018337249755859375, 0.019685745239257812, 0.02103424072265625, 0.022382736206054688, 0.023731231689453125, 0.025079727172851562, 0.02642822265625, 0.027776718139648438, 0.029125213623046875, 0.030473709106445312, 0.03182220458984375, 0.03317070007324219, 0.034519195556640625, 0.03586769104003906, 0.0372161865234375, 0.03856468200683594, 0.039913177490234375, 0.04126167297363281, 0.04261016845703125, 0.04395866394042969, 0.045307159423828125, 0.04665565490722656, 0.048004150390625]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 8.0, 29.0, 205.0, 512.0, 217.0, 39.0, 6.0, 1.0, 2.0], "bins": [-0.011850136332213879, -0.01164769846946001, -0.011445260606706142, -0.0112428218126297, -0.011040383949875832, -0.010837946087121964, -0.010635508224368095, -0.010433070361614227, -0.01023063249886036, -0.010028194636106491, -0.009825756773352623, -0.00962331797927618, -0.009420880116522312, -0.009218442253768444, -0.009016004391014576, -0.008813566528260708, -0.008611127734184265, -0.008408689871430397, -0.008206252008676529, -0.008003813214600086, -0.007801375351846218, -0.00759893748909235, -0.007396499626338482, -0.007194061763584614, -0.006991623435169458, -0.00678918557241559, -0.006586747244000435, -0.006384309381246567, -0.006181871518492699, -0.005979433190077543, -0.005776995327323675, -0.00557455699890852, -0.005372119136154652, -0.0051696812734007835, -0.004967242944985628, -0.00476480508223176, -0.004562366753816605, -0.0043599288910627365, -0.004157491028308868, -0.003955053165555, -0.003752614837139845, -0.003550176741555333, -0.0033477386459708214, -0.0031453007832169533, -0.0029428626876324415, -0.0027404245920479298, -0.0025379867292940617, -0.00233554863370955, -0.002133110538125038, -0.0019306724425405264, -0.0017282344633713365, -0.0015257964842021465, -0.0013233583886176348, -0.001120920293033123, -0.0009184823138639331, -0.0007160443346947432, -0.0005136063555255532, -0.0003111683181487024, -0.00010873028077185154, 9.37077566049993e-05, 0.00029614579398185015, 0.0004985838895663619, 0.0007010218687355518, 0.0009034598479047418, 0.0011058979434892535]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 6.0, 8.0, 20.0, 14.0, 10.0, 23.0, 16.0, 24.0, 27.0, 35.0, 29.0, 33.0, 27.0, 38.0, 44.0, 38.0, 44.0, 45.0, 51.0, 37.0, 33.0, 30.0, 22.0, 40.0, 38.0, 40.0, 29.0, 29.0, 17.0, 25.0, 21.0, 14.0, 15.0, 14.0, 10.0, 6.0, 7.0, 11.0, 4.0, 5.0, 4.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0011435151100158691, -0.0011076554656028748, -0.0010717958211898804, -0.001035936176776886, -0.0010000765323638916, -0.0009642168879508972, -0.0009283572435379028, -0.0008924975991249084, -0.0008566379547119141, -0.0008207783102989197, -0.0007849186658859253, -0.0007490590214729309, -0.0007131993770599365, -0.0006773397326469421, -0.0006414800882339478, -0.0006056204438209534, -0.000569760799407959, -0.0005339011549949646, -0.0004980415105819702, -0.00046218186616897583, -0.00042632222175598145, -0.00039046257734298706, -0.0003546029329299927, -0.0003187432885169983, -0.0002828836441040039, -0.0002470239996910095, -0.00021116435527801514, -0.00017530471086502075, -0.00013944506645202637, -0.00010358542203903198, -6.77257776260376e-05, -3.186613321304321e-05, 3.993511199951172e-06, 3.985315561294556e-05, 7.571280002593994e-05, 0.00011157244443893433, 0.0001474320888519287, 0.0001832917332649231, 0.00021915137767791748, 0.00025501102209091187, 0.00029087066650390625, 0.00032673031091690063, 0.000362589955329895, 0.0003984495997428894, 0.0004343092441558838, 0.0004701688885688782, 0.0005060285329818726, 0.0005418881773948669, 0.0005777478218078613, 0.0006136074662208557, 0.0006494671106338501, 0.0006853267550468445, 0.0007211863994598389, 0.0007570460438728333, 0.0007929056882858276, 0.000828765332698822, 0.0008646249771118164, 0.0009004846215248108, 0.0009363442659378052, 0.0009722039103507996, 0.001008063554763794, 0.0010439231991767883, 0.0010797828435897827, 0.001115642488002777, 0.0011515021324157715]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 9.0, 15.0, 18.0, 23.0, 29.0, 32.0, 26.0, 33.0, 42.0, 55.0, 42.0, 58.0, 52.0, 58.0, 53.0, 64.0, 56.0, 41.0, 50.0, 36.0, 34.0, 35.0, 23.0, 20.0, 20.0, 19.0, 15.0, 6.0, 8.0, 7.0, 5.0, 3.0, 5.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6953125, -12.2977294921875, -11.900146484375, -11.5025634765625, -11.10498046875, -10.7073974609375, -10.309814453125, -9.9122314453125, -9.5146484375, -9.1170654296875, -8.719482421875, -8.3218994140625, -7.92431640625, -7.5267333984375, -7.129150390625, -6.7315673828125, -6.333984375, -5.9364013671875, -5.538818359375, -5.1412353515625, -4.74365234375, -4.3460693359375, -3.948486328125, -3.5509033203125, -3.1533203125, -2.7557373046875, -2.358154296875, -1.9605712890625, -1.56298828125, -1.1654052734375, -0.767822265625, -0.3702392578125, 0.02734375, 0.4249267578125, 0.822509765625, 1.2200927734375, 1.61767578125, 2.0152587890625, 2.412841796875, 2.8104248046875, 3.2080078125, 3.6055908203125, 4.003173828125, 4.4007568359375, 4.79833984375, 5.1959228515625, 5.593505859375, 5.9910888671875, 6.388671875, 6.7862548828125, 7.183837890625, 7.5814208984375, 7.97900390625, 8.3765869140625, 8.774169921875, 9.1717529296875, 9.5693359375, 9.9669189453125, 10.364501953125, 10.7620849609375, 11.15966796875, 11.5572509765625, 11.954833984375, 12.3524169921875, 12.75]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 10.0, 11.0, 17.0, 22.0, 32.0, 51.0, 72.0, 98.0, 165.0, 243.0, 390.0, 667.0, 1273.0, 2339.0, 5300.0, 16791.0, 118303.0, 775776.0, 101478.0, 15533.0, 4839.0, 2205.0, 1189.0, 645.0, 399.0, 249.0, 143.0, 93.0, 58.0, 53.0, 34.0, 17.0, 17.0, 16.0, 8.0, 4.0, 3.0, 4.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.2578125, -11.8682861328125, -11.478759765625, -11.0892333984375, -10.69970703125, -10.3101806640625, -9.920654296875, -9.5311279296875, -9.1416015625, -8.7520751953125, -8.362548828125, -7.9730224609375, -7.58349609375, -7.1939697265625, -6.804443359375, -6.4149169921875, -6.025390625, -5.6358642578125, -5.246337890625, -4.8568115234375, -4.46728515625, -4.0777587890625, -3.688232421875, -3.2987060546875, -2.9091796875, -2.5196533203125, -2.130126953125, -1.7406005859375, -1.35107421875, -0.9615478515625, -0.572021484375, -0.1824951171875, 0.20703125, 0.5965576171875, 0.986083984375, 1.3756103515625, 1.76513671875, 2.1546630859375, 2.544189453125, 2.9337158203125, 3.3232421875, 3.7127685546875, 4.102294921875, 4.4918212890625, 4.88134765625, 5.2708740234375, 5.660400390625, 6.0499267578125, 6.439453125, 6.8289794921875, 7.218505859375, 7.6080322265625, 7.99755859375, 8.3870849609375, 8.776611328125, 9.1661376953125, 9.5556640625, 9.9451904296875, 10.334716796875, 10.7242431640625, 11.11376953125, 11.5032958984375, 11.892822265625, 12.2823486328125, 12.671875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 8.0, 8.0, 9.0, 5.0, 7.0, 10.0, 10.0, 16.0, 27.0, 19.0, 20.0, 22.0, 27.0, 34.0, 37.0, 25.0, 39.0, 37.0, 46.0, 43.0, 76.0, 1975.0, 102.0, 37.0, 33.0, 40.0, 43.0, 32.0, 21.0, 34.0, 24.0, 22.0, 31.0, 14.0, 12.0, 18.0, 19.0, 13.0, 11.0, 9.0, 6.0, 9.0, 3.0, 3.0, 2.0, 2.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-32.90625, -31.861328125, -30.81640625, -29.771484375, -28.7265625, -27.681640625, -26.63671875, -25.591796875, -24.546875, -23.501953125, -22.45703125, -21.412109375, -20.3671875, -19.322265625, -18.27734375, -17.232421875, -16.1875, -15.142578125, -14.09765625, -13.052734375, -12.0078125, -10.962890625, -9.91796875, -8.873046875, -7.828125, -6.783203125, -5.73828125, -4.693359375, -3.6484375, -2.603515625, -1.55859375, -0.513671875, 0.53125, 1.576171875, 2.62109375, 3.666015625, 4.7109375, 5.755859375, 6.80078125, 7.845703125, 8.890625, 9.935546875, 10.98046875, 12.025390625, 13.0703125, 14.115234375, 15.16015625, 16.205078125, 17.25, 18.294921875, 19.33984375, 20.384765625, 21.4296875, 22.474609375, 23.51953125, 24.564453125, 25.609375, 26.654296875, 27.69921875, 28.744140625, 29.7890625, 30.833984375, 31.87890625, 32.923828125, 33.96875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 8.0, 3.0, 12.0, 6.0, 12.0, 19.0, 13.0, 17.0, 12.0, 23.0, 36.0, 30.0, 46.0, 58.0, 60.0, 110.0, 169.0, 263.0, 585.0, 2390.0, 36163.0, 3093800.0, 9211.0, 1424.0, 442.0, 231.0, 137.0, 80.0, 69.0, 48.0, 37.0, 31.0, 28.0, 18.0, 21.0, 20.0, 11.0, 7.0, 9.0, 5.0, 5.0, 8.0, 11.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0], "bins": [-55.0, -53.298828125, -51.59765625, -49.896484375, -48.1953125, -46.494140625, -44.79296875, -43.091796875, -41.390625, -39.689453125, -37.98828125, -36.287109375, -34.5859375, -32.884765625, -31.18359375, -29.482421875, -27.78125, -26.080078125, -24.37890625, -22.677734375, -20.9765625, -19.275390625, -17.57421875, -15.873046875, -14.171875, -12.470703125, -10.76953125, -9.068359375, -7.3671875, -5.666015625, -3.96484375, -2.263671875, -0.5625, 1.138671875, 2.83984375, 4.541015625, 6.2421875, 7.943359375, 9.64453125, 11.345703125, 13.046875, 14.748046875, 16.44921875, 18.150390625, 19.8515625, 21.552734375, 23.25390625, 24.955078125, 26.65625, 28.357421875, 30.05859375, 31.759765625, 33.4609375, 35.162109375, 36.86328125, 38.564453125, 40.265625, 41.966796875, 43.66796875, 45.369140625, 47.0703125, 48.771484375, 50.47265625, 52.173828125, 53.875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 51.0, 772.0, 192.0], "bins": [-347.86907958984375, -342.31597900390625, -336.76287841796875, -331.20977783203125, -325.65667724609375, -320.1036071777344, -314.5505065917969, -308.9974060058594, -303.4443054199219, -297.8912048339844, -292.3381042480469, -286.7850036621094, -281.23193359375, -275.6788330078125, -270.125732421875, -264.5726318359375, -259.01953125, -253.4664306640625, -247.913330078125, -242.36024475097656, -236.80714416503906, -231.25404357910156, -225.70095825195312, -220.14785766601562, -214.59475708007812, -209.04165649414062, -203.48855590820312, -197.9354705810547, -192.3823699951172, -186.8292694091797, -181.27618408203125, -175.72308349609375, -170.16998291015625, -164.61688232421875, -159.06378173828125, -153.5106964111328, -147.9575958251953, -142.4044952392578, -136.85140991210938, -131.29830932617188, -125.74520874023438, -120.19210815429688, -114.6390151977539, -109.08592224121094, -103.53282165527344, -97.97972106933594, -92.42662811279297, -86.87353515625, -81.3204345703125, -75.767333984375, -70.21424102783203, -64.66114807128906, -59.10804748535156, -53.55495071411133, -48.001853942871094, -42.44875717163086, -36.895660400390625, -31.34256362915039, -25.789466857910156, -20.236370086669922, -14.683273315429688, -9.130176544189453, -3.5770797729492188, 1.9760169982910156, 7.529114723205566]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 6.0, 9.0, 7.0, 7.0, 11.0, 12.0, 13.0, 20.0, 19.0, 24.0, 24.0, 12.0, 22.0, 26.0, 23.0, 36.0, 37.0, 46.0, 40.0, 39.0, 43.0, 38.0, 41.0, 37.0, 31.0, 38.0, 42.0, 29.0, 32.0, 35.0, 17.0, 20.0, 27.0, 20.0, 21.0, 18.0, 15.0, 18.0, 7.0, 5.0, 4.0, 7.0, 4.0, 7.0, 1.0, 3.0, 3.0, 0.0, 1.0, 6.0], "bins": [-117.0850601196289, -113.75557708740234, -110.42609405517578, -107.09660339355469, -103.76712036132812, -100.43763732910156, -97.108154296875, -93.77867126464844, -90.44918823242188, -87.11970520019531, -83.79022216796875, -80.46073913574219, -77.1312484741211, -73.80176544189453, -70.47228240966797, -67.1427993774414, -63.81330871582031, -60.48382568359375, -57.15433883666992, -53.82485580444336, -50.49536895751953, -47.16588592529297, -43.836402893066406, -40.506919860839844, -37.177433013916016, -33.84794998168945, -30.518463134765625, -27.188980102539062, -23.859495162963867, -20.530010223388672, -17.20052719116211, -13.871042251586914, -10.541549682617188, -7.21206521987915, -3.8825807571411133, -0.5530967712402344, 2.776388168334961, 6.105873107910156, 9.435356140136719, 12.764841079711914, 16.09432601928711, 19.423810958862305, 22.7532958984375, 26.082778930664062, 29.412263870239258, 32.74174880981445, 36.071231842041016, 39.400718688964844, 42.730201721191406, 46.05968475341797, 49.3891716003418, 52.71865463256836, 56.04814147949219, 59.37762451171875, 62.70710754394531, 66.03659057617188, 69.36607360839844, 72.695556640625, 76.02503967285156, 79.35452270507812, 82.68401336669922, 86.01349639892578, 89.34297943115234, 92.6724624633789, 96.001953125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0, 6.0, 7.0, 8.0, 13.0, 15.0, 24.0, 32.0, 25.0, 27.0, 39.0, 42.0, 51.0, 45.0, 51.0, 59.0, 58.0, 44.0, 63.0, 56.0, 40.0, 46.0, 42.0, 35.0, 25.0, 29.0, 27.0, 18.0, 18.0, 15.0, 11.0, 6.0, 7.0, 5.0, 5.0, 5.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7109375, -12.314208984375, -11.91748046875, -11.520751953125, -11.1240234375, -10.727294921875, -10.33056640625, -9.933837890625, -9.537109375, -9.140380859375, -8.74365234375, -8.346923828125, -7.9501953125, -7.553466796875, -7.15673828125, -6.760009765625, -6.36328125, -5.966552734375, -5.56982421875, -5.173095703125, -4.7763671875, -4.379638671875, -3.98291015625, -3.586181640625, -3.189453125, -2.792724609375, -2.39599609375, -1.999267578125, -1.6025390625, -1.205810546875, -0.80908203125, -0.412353515625, -0.015625, 0.381103515625, 0.77783203125, 1.174560546875, 1.5712890625, 1.968017578125, 2.36474609375, 2.761474609375, 3.158203125, 3.554931640625, 3.95166015625, 4.348388671875, 4.7451171875, 5.141845703125, 5.53857421875, 5.935302734375, 6.33203125, 6.728759765625, 7.12548828125, 7.522216796875, 7.9189453125, 8.315673828125, 8.71240234375, 9.109130859375, 9.505859375, 9.902587890625, 10.29931640625, 10.696044921875, 11.0927734375, 11.489501953125, 11.88623046875, 12.282958984375, 12.6796875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 5.0, 8.0, 6.0, 7.0, 11.0, 23.0, 37.0, 49.0, 66.0, 117.0, 154.0, 380.0, 699.0, 1624.0, 4431.0, 18684.0, 1807072.0, 2328183.0, 24350.0, 4868.0, 1871.0, 808.0, 360.0, 191.0, 95.0, 61.0, 39.0, 24.0, 16.0, 12.0, 12.0, 9.0, 8.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.65625, -46.21337890625, -44.7705078125, -43.32763671875, -41.884765625, -40.44189453125, -38.9990234375, -37.55615234375, -36.11328125, -34.67041015625, -33.2275390625, -31.78466796875, -30.341796875, -28.89892578125, -27.4560546875, -26.01318359375, -24.5703125, -23.12744140625, -21.6845703125, -20.24169921875, -18.798828125, -17.35595703125, -15.9130859375, -14.47021484375, -13.02734375, -11.58447265625, -10.1416015625, -8.69873046875, -7.255859375, -5.81298828125, -4.3701171875, -2.92724609375, -1.484375, -0.04150390625, 1.4013671875, 2.84423828125, 4.287109375, 5.72998046875, 7.1728515625, 8.61572265625, 10.05859375, 11.50146484375, 12.9443359375, 14.38720703125, 15.830078125, 17.27294921875, 18.7158203125, 20.15869140625, 21.6015625, 23.04443359375, 24.4873046875, 25.93017578125, 27.373046875, 28.81591796875, 30.2587890625, 31.70166015625, 33.14453125, 34.58740234375, 36.0302734375, 37.47314453125, 38.916015625, 40.35888671875, 41.8017578125, 43.24462890625, 44.6875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 7.0, 1.0, 0.0, 0.0, 4.0, 10.0, 5.0, 3.0, 11.0, 8.0, 21.0, 36.0, 40.0, 72.0, 182.0, 413.0, 820.0, 1057.0, 710.0, 346.0, 149.0, 57.0, 45.0, 19.0, 23.0, 7.0, 6.0, 8.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-45.625, -44.36962890625, -43.1142578125, -41.85888671875, -40.603515625, -39.34814453125, -38.0927734375, -36.83740234375, -35.58203125, -34.32666015625, -33.0712890625, -31.81591796875, -30.560546875, -29.30517578125, -28.0498046875, -26.79443359375, -25.5390625, -24.28369140625, -23.0283203125, -21.77294921875, -20.517578125, -19.26220703125, -18.0068359375, -16.75146484375, -15.49609375, -14.24072265625, -12.9853515625, -11.72998046875, -10.474609375, -9.21923828125, -7.9638671875, -6.70849609375, -5.453125, -4.19775390625, -2.9423828125, -1.68701171875, -0.431640625, 0.82373046875, 2.0791015625, 3.33447265625, 4.58984375, 5.84521484375, 7.1005859375, 8.35595703125, 9.611328125, 10.86669921875, 12.1220703125, 13.37744140625, 14.6328125, 15.88818359375, 17.1435546875, 18.39892578125, 19.654296875, 20.90966796875, 22.1650390625, 23.42041015625, 24.67578125, 25.93115234375, 27.1865234375, 28.44189453125, 29.697265625, 30.95263671875, 32.2080078125, 33.46337890625, 34.71875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 9.0, 13.0, 13.0, 33.0, 48.0, 66.0, 130.0, 218.0, 408.0, 818.0, 1590.0, 3201.0, 7629.0, 22451.0, 143247.0, 3708148.0, 261608.0, 28307.0, 8968.0, 3682.0, 1717.0, 914.0, 473.0, 224.0, 152.0, 61.0, 60.0, 39.0, 13.0, 12.0, 7.0, 9.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.5, -49.75927734375, -48.0185546875, -46.27783203125, -44.537109375, -42.79638671875, -41.0556640625, -39.31494140625, -37.57421875, -35.83349609375, -34.0927734375, -32.35205078125, -30.611328125, -28.87060546875, -27.1298828125, -25.38916015625, -23.6484375, -21.90771484375, -20.1669921875, -18.42626953125, -16.685546875, -14.94482421875, -13.2041015625, -11.46337890625, -9.72265625, -7.98193359375, -6.2412109375, -4.50048828125, -2.759765625, -1.01904296875, 0.7216796875, 2.46240234375, 4.203125, 5.94384765625, 7.6845703125, 9.42529296875, 11.166015625, 12.90673828125, 14.6474609375, 16.38818359375, 18.12890625, 19.86962890625, 21.6103515625, 23.35107421875, 25.091796875, 26.83251953125, 28.5732421875, 30.31396484375, 32.0546875, 33.79541015625, 35.5361328125, 37.27685546875, 39.017578125, 40.75830078125, 42.4990234375, 44.23974609375, 45.98046875, 47.72119140625, 49.4619140625, 51.20263671875, 52.943359375, 54.68408203125, 56.4248046875, 58.16552734375, 59.90625]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 9.0, 13.0, 31.0, 95.0, 232.0, 384.0, 144.0, 66.0, 23.0, 10.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-79.8553237915039, -70.20564270019531, -60.55596160888672, -50.90628433227539, -41.2566032409668, -31.606922149658203, -21.957244873046875, -12.307563781738281, -2.6578826904296875, 6.99179744720459, 16.641477584838867, 26.291156768798828, 35.94083786010742, 45.590518951416016, 55.240196228027344, 64.88987731933594, 74.53955841064453, 84.18923950195312, 93.83892059326172, 103.48860168457031, 113.13827514648438, 122.7879638671875, 132.43763732910156, 142.08731079101562, 151.73699951171875, 161.3866729736328, 171.03636169433594, 180.68603515625, 190.33572387695312, 199.9853973388672, 209.63507080078125, 219.28475952148438, 228.93441772460938, 238.58409118652344, 248.23377990722656, 257.8834533691406, 267.53314208984375, 277.1828308105469, 286.8324890136719, 296.482177734375, 306.1318664550781, 315.78155517578125, 325.43121337890625, 335.0809020996094, 344.7305908203125, 354.3802795410156, 364.0299377441406, 373.67962646484375, 383.32928466796875, 392.9789733886719, 402.6286315917969, 412.2783203125, 421.9280090332031, 431.57769775390625, 441.22735595703125, 450.8770446777344, 460.5267333984375, 470.1764221191406, 479.8260803222656, 489.47576904296875, 499.1254577636719, 508.775146484375, 518.4248046875, 528.074462890625, 537.7241821289062]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 4.0, 6.0, 15.0, 6.0, 14.0, 13.0, 16.0, 16.0, 19.0, 19.0, 22.0, 25.0, 37.0, 28.0, 34.0, 37.0, 30.0, 45.0, 43.0, 27.0, 38.0, 21.0, 41.0, 36.0, 37.0, 30.0, 27.0, 29.0, 30.0, 26.0, 38.0, 33.0, 19.0, 18.0, 21.0, 21.0, 10.0, 12.0, 14.0, 3.0, 10.0, 6.0, 8.0, 1.0, 6.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-74.33089447021484, -71.9674072265625, -69.60391235351562, -67.24042510986328, -64.8769302368164, -62.51344299316406, -60.14995193481445, -57.786460876464844, -55.422969818115234, -53.059478759765625, -50.695987701416016, -48.332496643066406, -45.96900939941406, -43.60551452636719, -41.242027282714844, -38.878536224365234, -36.515045166015625, -34.151554107666016, -31.788063049316406, -29.42457389831543, -27.06108283996582, -24.69759178161621, -22.334102630615234, -19.970611572265625, -17.607120513916016, -15.243629455566406, -12.880139350891113, -10.51664924621582, -8.153158187866211, -5.789667129516602, -3.4261770248413086, -1.0626869201660156, 1.3007965087890625, 3.6642870903015137, 6.027777671813965, 8.391267776489258, 10.754758834838867, 13.118249893188477, 15.48173999786377, 17.845230102539062, 20.208721160888672, 22.57221221923828, 24.93570327758789, 27.299192428588867, 29.662683486938477, 32.02617645263672, 34.38966369628906, 36.75315475463867, 39.11664581298828, 41.48013687133789, 43.8436279296875, 46.20711898803711, 48.57061004638672, 50.93409729003906, 53.29758834838867, 55.66107940673828, 58.02457046508789, 60.3880615234375, 62.75155258178711, 65.11504364013672, 67.47853088378906, 69.84202575683594, 72.20551300048828, 74.56900024414062, 76.9324951171875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 10.0, 13.0, 13.0, 18.0, 20.0, 26.0, 23.0, 22.0, 50.0, 34.0, 44.0, 44.0, 52.0, 74.0, 53.0, 57.0, 60.0, 40.0, 34.0, 52.0, 44.0, 32.0, 25.0, 32.0, 29.0, 23.0, 17.0, 12.0, 12.0, 8.0, 3.0, 6.0, 5.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7734375, -13.368896484375, -12.96435546875, -12.559814453125, -12.1552734375, -11.750732421875, -11.34619140625, -10.941650390625, -10.537109375, -10.132568359375, -9.72802734375, -9.323486328125, -8.9189453125, -8.514404296875, -8.10986328125, -7.705322265625, -7.30078125, -6.896240234375, -6.49169921875, -6.087158203125, -5.6826171875, -5.278076171875, -4.87353515625, -4.468994140625, -4.064453125, -3.659912109375, -3.25537109375, -2.850830078125, -2.4462890625, -2.041748046875, -1.63720703125, -1.232666015625, -0.828125, -0.423583984375, -0.01904296875, 0.385498046875, 0.7900390625, 1.194580078125, 1.59912109375, 2.003662109375, 2.408203125, 2.812744140625, 3.21728515625, 3.621826171875, 4.0263671875, 4.430908203125, 4.83544921875, 5.239990234375, 5.64453125, 6.049072265625, 6.45361328125, 6.858154296875, 7.2626953125, 7.667236328125, 8.07177734375, 8.476318359375, 8.880859375, 9.285400390625, 9.68994140625, 10.094482421875, 10.4990234375, 10.903564453125, 11.30810546875, 11.712646484375, 12.1171875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 7.0, 4.0, 10.0, 14.0, 24.0, 39.0, 61.0, 98.0, 182.0, 265.0, 385.0, 674.0, 1030.0, 1806.0, 3144.0, 5558.0, 10104.0, 18516.0, 34611.0, 69015.0, 155969.0, 338005.0, 219996.0, 92389.0, 44494.0, 23111.0, 12598.0, 6961.0, 3864.0, 2264.0, 1285.0, 800.0, 477.0, 275.0, 195.0, 115.0, 66.0, 47.0, 34.0, 26.0, 15.0, 9.0, 7.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.240234375, -1.2010955810546875, -1.161956787109375, -1.1228179931640625, -1.08367919921875, -1.0445404052734375, -1.005401611328125, -0.9662628173828125, -0.9271240234375, -0.8879852294921875, -0.848846435546875, -0.8097076416015625, -0.77056884765625, -0.7314300537109375, -0.692291259765625, -0.6531524658203125, -0.614013671875, -0.5748748779296875, -0.535736083984375, -0.4965972900390625, -0.45745849609375, -0.4183197021484375, -0.379180908203125, -0.3400421142578125, -0.3009033203125, -0.2617645263671875, -0.222625732421875, -0.1834869384765625, -0.14434814453125, -0.1052093505859375, -0.066070556640625, -0.0269317626953125, 0.01220703125, 0.0513458251953125, 0.090484619140625, 0.1296234130859375, 0.16876220703125, 0.2079010009765625, 0.247039794921875, 0.2861785888671875, 0.3253173828125, 0.3644561767578125, 0.403594970703125, 0.4427337646484375, 0.48187255859375, 0.5210113525390625, 0.560150146484375, 0.5992889404296875, 0.638427734375, 0.6775665283203125, 0.716705322265625, 0.7558441162109375, 0.79498291015625, 0.8341217041015625, 0.873260498046875, 0.9123992919921875, 0.9515380859375, 0.9906768798828125, 1.029815673828125, 1.0689544677734375, 1.10809326171875, 1.1472320556640625, 1.186370849609375, 1.2255096435546875, 1.2646484375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 7.0, 5.0, 12.0, 5.0, 10.0, 10.0, 11.0, 21.0, 15.0, 16.0, 26.0, 24.0, 29.0, 32.0, 30.0, 24.0, 32.0, 28.0, 26.0, 31.0, 39.0, 32.0, 39.0, 1056.0, 30.0, 30.0, 29.0, 34.0, 30.0, 25.0, 38.0, 26.0, 33.0, 18.0, 24.0, 20.0, 18.0, 15.0, 13.0, 14.0, 13.0, 10.0, 11.0, 9.0, 2.0, 5.0, 5.0, 8.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-5.296875, -5.11749267578125, -4.9381103515625, -4.75872802734375, -4.579345703125, -4.39996337890625, -4.2205810546875, -4.04119873046875, -3.86181640625, -3.68243408203125, -3.5030517578125, -3.32366943359375, -3.144287109375, -2.96490478515625, -2.7855224609375, -2.60614013671875, -2.4267578125, -2.24737548828125, -2.0679931640625, -1.88861083984375, -1.709228515625, -1.52984619140625, -1.3504638671875, -1.17108154296875, -0.99169921875, -0.81231689453125, -0.6329345703125, -0.45355224609375, -0.274169921875, -0.09478759765625, 0.0845947265625, 0.26397705078125, 0.443359375, 0.62274169921875, 0.8021240234375, 0.98150634765625, 1.160888671875, 1.34027099609375, 1.5196533203125, 1.69903564453125, 1.87841796875, 2.05780029296875, 2.2371826171875, 2.41656494140625, 2.595947265625, 2.77532958984375, 2.9547119140625, 3.13409423828125, 3.3134765625, 3.49285888671875, 3.6722412109375, 3.85162353515625, 4.031005859375, 4.21038818359375, 4.3897705078125, 4.56915283203125, 4.74853515625, 4.92791748046875, 5.1072998046875, 5.28668212890625, 5.466064453125, 5.64544677734375, 5.8248291015625, 6.00421142578125, 6.18359375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 5.0, 13.0, 6.0, 17.0, 30.0, 29.0, 47.0, 66.0, 82.0, 163.0, 240.0, 326.0, 536.0, 816.0, 1293.0, 2119.0, 3546.0, 5696.0, 9056.0, 14970.0, 25782.0, 43802.0, 79473.0, 154233.0, 1324730.0, 199372.0, 98840.0, 54167.0, 31041.0, 18147.0, 10904.0, 6547.0, 4032.0, 2569.0, 1570.0, 1021.0, 654.0, 376.0, 264.0, 175.0, 113.0, 89.0, 52.0, 37.0, 31.0, 23.0, 11.0, 9.0, 6.0, 4.0, 1.0, 4.0, 1.0, 2.0], "bins": [-1.1005859375, -1.06884765625, -1.037109375, -1.00537109375, -0.9736328125, -0.94189453125, -0.91015625, -0.87841796875, -0.8466796875, -0.81494140625, -0.783203125, -0.75146484375, -0.7197265625, -0.68798828125, -0.65625, -0.62451171875, -0.5927734375, -0.56103515625, -0.529296875, -0.49755859375, -0.4658203125, -0.43408203125, -0.40234375, -0.37060546875, -0.3388671875, -0.30712890625, -0.275390625, -0.24365234375, -0.2119140625, -0.18017578125, -0.1484375, -0.11669921875, -0.0849609375, -0.05322265625, -0.021484375, 0.01025390625, 0.0419921875, 0.07373046875, 0.10546875, 0.13720703125, 0.1689453125, 0.20068359375, 0.232421875, 0.26416015625, 0.2958984375, 0.32763671875, 0.359375, 0.39111328125, 0.4228515625, 0.45458984375, 0.486328125, 0.51806640625, 0.5498046875, 0.58154296875, 0.61328125, 0.64501953125, 0.6767578125, 0.70849609375, 0.740234375, 0.77197265625, 0.8037109375, 0.83544921875, 0.8671875, 0.89892578125, 0.9306640625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 3.0, 3.0, 4.0, 10.0, 7.0, 11.0, 14.0, 12.0, 16.0, 22.0, 15.0, 25.0, 31.0, 29.0, 40.0, 45.0, 47.0, 61.0, 59.0, 56.0, 46.0, 60.0, 45.0, 44.0, 43.0, 49.0, 32.0, 34.0, 25.0, 23.0, 17.0, 12.0, 11.0, 8.0, 11.0, 9.0, 6.0, 8.0, 6.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00196075439453125, -0.0018971562385559082, -0.0018335580825805664, -0.0017699599266052246, -0.0017063617706298828, -0.001642763614654541, -0.0015791654586791992, -0.0015155673027038574, -0.0014519691467285156, -0.0013883709907531738, -0.001324772834777832, -0.0012611746788024902, -0.0011975765228271484, -0.0011339783668518066, -0.0010703802108764648, -0.001006782054901123, -0.0009431838989257812, -0.0008795857429504395, -0.0008159875869750977, -0.0007523894309997559, -0.0006887912750244141, -0.0006251931190490723, -0.0005615949630737305, -0.0004979968070983887, -0.0004343986511230469, -0.0003708004951477051, -0.0003072023391723633, -0.00024360418319702148, -0.0001800060272216797, -0.00011640787124633789, -5.2809715270996094e-05, 1.0788440704345703e-05, 7.43865966796875e-05, 0.0001379847526550293, 0.0002015829086303711, 0.0002651810646057129, 0.0003287792205810547, 0.0003923773765563965, 0.0004559755325317383, 0.0005195736885070801, 0.0005831718444824219, 0.0006467700004577637, 0.0007103681564331055, 0.0007739663124084473, 0.0008375644683837891, 0.0009011626243591309, 0.0009647607803344727, 0.0010283589363098145, 0.0010919570922851562, 0.001155555248260498, 0.0012191534042358398, 0.0012827515602111816, 0.0013463497161865234, 0.0014099478721618652, 0.001473546028137207, 0.0015371441841125488, 0.0016007423400878906, 0.0016643404960632324, 0.0017279386520385742, 0.001791536808013916, 0.0018551349639892578, 0.0019187331199645996, 0.0019823312759399414, 0.002045929431915283, 0.002109527587890625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 2.0, 10.0, 6.0, 4.0, 13.0, 14.0, 18.0, 22.0, 27.0, 44.0, 49.0, 64.0, 96.0, 132.0, 149.0, 209.0, 323.0, 673.0, 8932.0, 956482.0, 78716.0, 1227.0, 406.0, 245.0, 159.0, 129.0, 83.0, 82.0, 51.0, 52.0, 30.0, 29.0, 18.0, 14.0, 12.0, 7.0, 6.0, 3.0, 4.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.04119873046875, -0.039938926696777344, -0.03867912292480469, -0.03741931915283203, -0.036159515380859375, -0.03489971160888672, -0.03363990783691406, -0.032380104064941406, -0.03112030029296875, -0.029860496520996094, -0.028600692749023438, -0.02734088897705078, -0.026081085205078125, -0.02482128143310547, -0.023561477661132812, -0.022301673889160156, -0.0210418701171875, -0.019782066345214844, -0.018522262573242188, -0.01726245880126953, -0.016002655029296875, -0.014742851257324219, -0.013483047485351562, -0.012223243713378906, -0.01096343994140625, -0.009703636169433594, -0.008443832397460938, -0.007184028625488281, -0.005924224853515625, -0.004664421081542969, -0.0034046173095703125, -0.0021448135375976562, -0.000885009765625, 0.00037479400634765625, 0.0016345977783203125, 0.0028944015502929688, 0.004154205322265625, 0.005414009094238281, 0.0066738128662109375, 0.007933616638183594, 0.00919342041015625, 0.010453224182128906, 0.011713027954101562, 0.012972831726074219, 0.014232635498046875, 0.015492439270019531, 0.016752243041992188, 0.018012046813964844, 0.0192718505859375, 0.020531654357910156, 0.021791458129882812, 0.02305126190185547, 0.024311065673828125, 0.02557086944580078, 0.026830673217773438, 0.028090476989746094, 0.02935028076171875, 0.030610084533691406, 0.03186988830566406, 0.03312969207763672, 0.034389495849609375, 0.03564929962158203, 0.03690910339355469, 0.038168907165527344, 0.0394287109375]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 20.0, 77.0, 215.0, 361.0, 224.0, 77.0, 24.0, 10.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023426932748407125, -0.0022011171095073223, -0.002059540944173932, -0.0019179648952558637, -0.0017763887299224734, -0.0016348125645890832, -0.0014932365156710148, -0.0013516603503376245, -0.0012100841850042343, -0.001068508019670844, -0.0009269319125451148, -0.0007853558054193854, -0.0006437796400859952, -0.000502203474752605, -0.00036062736762687564, -0.00021905126050114632, -7.747509516775608e-05, 6.41010410618037e-05, 0.00020567717729136348, 0.00034725331352092326, 0.000488829449750483, 0.0006304056150838733, 0.0007719817222096026, 0.0009135578293353319, 0.0010551339946687222, 0.0011967101600021124, 0.0013382863253355026, 0.001479862374253571, 0.0016214385395869613, 0.0017630147049203515, 0.00190459075383842, 0.00204616691917181, 0.002187743317335844, 0.0023293194826692343, 0.0024708956480026245, 0.0026124718133360147, 0.002754047978669405, 0.0028956239111721516, 0.003037200076505542, 0.003178776241838932, 0.0033203524071723223, 0.0034619285725057125, 0.0036035047378391027, 0.003745080903172493, 0.0038866568356752396, 0.0040282332338392735, 0.00416980916634202, 0.004311385564506054, 0.0044529614970088005, 0.004594537429511547, 0.004736113827675581, 0.0048776897601783276, 0.0050192661583423615, 0.005160842090845108, 0.005302418489009142, 0.0054439944215118885, 0.005585570819675922, 0.005727146752178669, 0.005868723150342703, 0.0060102990828454494, 0.006151875481009483, 0.00629345141351223, 0.006435027811676264, 0.00657660374417901, 0.006718179676681757]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 7.0, 4.0, 7.0, 12.0, 7.0, 9.0, 17.0, 14.0, 23.0, 22.0, 20.0, 25.0, 32.0, 30.0, 40.0, 31.0, 41.0, 41.0, 46.0, 30.0, 52.0, 42.0, 49.0, 44.0, 40.0, 58.0, 34.0, 20.0, 25.0, 32.0, 20.0, 16.0, 12.0, 19.0, 23.0, 11.0, 13.0, 10.0, 7.0, 11.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010796785354614258, -0.0010438775643706322, -0.0010080765932798386, -0.000972275622189045, -0.0009364746510982513, -0.0009006736800074577, -0.0008648727089166641, -0.0008290717378258705, -0.0007932707667350769, -0.0007574697956442833, -0.0007216688245534897, -0.0006858678534626961, -0.0006500668823719025, -0.0006142659112811089, -0.0005784649401903152, -0.0005426639690995216, -0.000506862998008728, -0.0004710620269179344, -0.0004352610558271408, -0.0003994600847363472, -0.0003636591136455536, -0.00032785814255476, -0.00029205717146396637, -0.00025625620037317276, -0.00022045522928237915, -0.00018465425819158554, -0.00014885328710079193, -0.00011305231600999832, -7.725134491920471e-05, -4.14503738284111e-05, -5.649402737617493e-06, 3.0151568353176117e-05, 6.595253944396973e-05, 0.00010175351053476334, 0.00013755448162555695, 0.00017335545271635056, 0.00020915642380714417, 0.0002449573948979378, 0.0002807583659887314, 0.000316559337079525, 0.0003523603081703186, 0.0003881612792611122, 0.0004239622503519058, 0.00045976322144269943, 0.000495564192533493, 0.0005313651636242867, 0.0005671661347150803, 0.0006029671058058739, 0.0006387680768966675, 0.0006745690479874611, 0.0007103700190782547, 0.0007461709901690483, 0.0007819719612598419, 0.0008177729323506355, 0.0008535739034414291, 0.0008893748745322227, 0.0009251758456230164, 0.00096097681671381, 0.0009967777878046036, 0.0010325787588953972, 0.0010683797299861908, 0.0011041807010769844, 0.001139981672167778, 0.0011757826432585716, 0.0012115836143493652]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 2.0, 6.0, 10.0, 13.0, 13.0, 18.0, 20.0, 26.0, 23.0, 22.0, 50.0, 34.0, 44.0, 44.0, 52.0, 74.0, 53.0, 57.0, 60.0, 40.0, 34.0, 52.0, 44.0, 32.0, 25.0, 32.0, 29.0, 23.0, 17.0, 12.0, 12.0, 8.0, 3.0, 6.0, 5.0, 2.0, 2.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7734375, -13.368896484375, -12.96435546875, -12.559814453125, -12.1552734375, -11.750732421875, -11.34619140625, -10.941650390625, -10.537109375, -10.132568359375, -9.72802734375, -9.323486328125, -8.9189453125, -8.514404296875, -8.10986328125, -7.705322265625, -7.30078125, -6.896240234375, -6.49169921875, -6.087158203125, -5.6826171875, -5.278076171875, -4.87353515625, -4.468994140625, -4.064453125, -3.659912109375, -3.25537109375, -2.850830078125, -2.4462890625, -2.041748046875, -1.63720703125, -1.232666015625, -0.828125, -0.423583984375, -0.01904296875, 0.385498046875, 0.7900390625, 1.194580078125, 1.59912109375, 2.003662109375, 2.408203125, 2.812744140625, 3.21728515625, 3.621826171875, 4.0263671875, 4.430908203125, 4.83544921875, 5.239990234375, 5.64453125, 6.049072265625, 6.45361328125, 6.858154296875, 7.2626953125, 7.667236328125, 8.07177734375, 8.476318359375, 8.880859375, 9.285400390625, 9.68994140625, 10.094482421875, 10.4990234375, 10.903564453125, 11.30810546875, 11.712646484375, 12.1171875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 0.0, 6.0, 7.0, 15.0, 13.0, 29.0, 44.0, 49.0, 73.0, 103.0, 158.0, 246.0, 332.0, 586.0, 1057.0, 2073.0, 4310.0, 11455.0, 44646.0, 278559.0, 581210.0, 91530.0, 19528.0, 6368.0, 2750.0, 1384.0, 699.0, 454.0, 283.0, 215.0, 129.0, 78.0, 44.0, 31.0, 28.0, 14.0, 15.0, 12.0, 7.0, 5.0, 4.0, 5.0, 4.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.1171875, -8.8507080078125, -8.584228515625, -8.3177490234375, -8.05126953125, -7.7847900390625, -7.518310546875, -7.2518310546875, -6.9853515625, -6.7188720703125, -6.452392578125, -6.1859130859375, -5.91943359375, -5.6529541015625, -5.386474609375, -5.1199951171875, -4.853515625, -4.5870361328125, -4.320556640625, -4.0540771484375, -3.78759765625, -3.5211181640625, -3.254638671875, -2.9881591796875, -2.7216796875, -2.4552001953125, -2.188720703125, -1.9222412109375, -1.65576171875, -1.3892822265625, -1.122802734375, -0.8563232421875, -0.58984375, -0.3233642578125, -0.056884765625, 0.2095947265625, 0.47607421875, 0.7425537109375, 1.009033203125, 1.2755126953125, 1.5419921875, 1.8084716796875, 2.074951171875, 2.3414306640625, 2.60791015625, 2.8743896484375, 3.140869140625, 3.4073486328125, 3.673828125, 3.9403076171875, 4.206787109375, 4.4732666015625, 4.73974609375, 5.0062255859375, 5.272705078125, 5.5391845703125, 5.8056640625, 6.0721435546875, 6.338623046875, 6.6051025390625, 6.87158203125, 7.1380615234375, 7.404541015625, 7.6710205078125, 7.9375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 2.0, 10.0, 5.0, 10.0, 12.0, 17.0, 25.0, 16.0, 27.0, 26.0, 25.0, 25.0, 27.0, 25.0, 34.0, 36.0, 50.0, 43.0, 98.0, 1860.0, 185.0, 52.0, 62.0, 36.0, 39.0, 44.0, 35.0, 37.0, 19.0, 21.0, 23.0, 18.0, 17.0, 17.0, 6.0, 9.0, 6.0, 12.0, 11.0, 7.0, 9.0, 0.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-35.75, -34.6552734375, -33.560546875, -32.4658203125, -31.37109375, -30.2763671875, -29.181640625, -28.0869140625, -26.9921875, -25.8974609375, -24.802734375, -23.7080078125, -22.61328125, -21.5185546875, -20.423828125, -19.3291015625, -18.234375, -17.1396484375, -16.044921875, -14.9501953125, -13.85546875, -12.7607421875, -11.666015625, -10.5712890625, -9.4765625, -8.3818359375, -7.287109375, -6.1923828125, -5.09765625, -4.0029296875, -2.908203125, -1.8134765625, -0.71875, 0.3759765625, 1.470703125, 2.5654296875, 3.66015625, 4.7548828125, 5.849609375, 6.9443359375, 8.0390625, 9.1337890625, 10.228515625, 11.3232421875, 12.41796875, 13.5126953125, 14.607421875, 15.7021484375, 16.796875, 17.8916015625, 18.986328125, 20.0810546875, 21.17578125, 22.2705078125, 23.365234375, 24.4599609375, 25.5546875, 26.6494140625, 27.744140625, 28.8388671875, 29.93359375, 31.0283203125, 32.123046875, 33.2177734375, 34.3125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 1.0, 6.0, 10.0, 11.0, 11.0, 7.0, 6.0, 12.0, 15.0, 21.0, 19.0, 29.0, 26.0, 36.0, 70.0, 73.0, 122.0, 144.0, 251.0, 537.0, 1816.0, 73459.0, 3062130.0, 5055.0, 796.0, 331.0, 209.0, 125.0, 80.0, 54.0, 37.0, 35.0, 34.0, 22.0, 22.0, 27.0, 15.0, 13.0, 9.0, 5.0, 9.0, 3.0, 5.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-57.46875, -55.62841796875, -53.7880859375, -51.94775390625, -50.107421875, -48.26708984375, -46.4267578125, -44.58642578125, -42.74609375, -40.90576171875, -39.0654296875, -37.22509765625, -35.384765625, -33.54443359375, -31.7041015625, -29.86376953125, -28.0234375, -26.18310546875, -24.3427734375, -22.50244140625, -20.662109375, -18.82177734375, -16.9814453125, -15.14111328125, -13.30078125, -11.46044921875, -9.6201171875, -7.77978515625, -5.939453125, -4.09912109375, -2.2587890625, -0.41845703125, 1.421875, 3.26220703125, 5.1025390625, 6.94287109375, 8.783203125, 10.62353515625, 12.4638671875, 14.30419921875, 16.14453125, 17.98486328125, 19.8251953125, 21.66552734375, 23.505859375, 25.34619140625, 27.1865234375, 29.02685546875, 30.8671875, 32.70751953125, 34.5478515625, 36.38818359375, 38.228515625, 40.06884765625, 41.9091796875, 43.74951171875, 45.58984375, 47.43017578125, 49.2705078125, 51.11083984375, 52.951171875, 54.79150390625, 56.6318359375, 58.47216796875, 60.3125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 169.0, 774.0, 69.0, 1.0], "bins": [-341.38720703125, -335.8251953125, -330.2631530761719, -324.7011413574219, -319.13909912109375, -313.57708740234375, -308.0150451660156, -302.4530334472656, -296.8909912109375, -291.3289794921875, -285.7669372558594, -280.2049255371094, -274.64288330078125, -269.08087158203125, -263.5188293457031, -257.9568176269531, -252.39479064941406, -246.832763671875, -241.27073669433594, -235.70870971679688, -230.1466827392578, -224.58465576171875, -219.02264404296875, -213.46060180664062, -207.89859008789062, -202.33656311035156, -196.7745361328125, -191.21250915527344, -185.65048217773438, -180.0884552001953, -174.52642822265625, -168.96441650390625, -163.4023895263672, -157.84036254882812, -152.27833557128906, -146.71630859375, -141.15428161621094, -135.59225463867188, -130.03024291992188, -124.46820831298828, -118.90618133544922, -113.34415435791016, -107.7821273803711, -102.22010803222656, -96.6580810546875, -91.09605407714844, -85.53402709960938, -79.97200012207031, -74.40997314453125, -68.84794616699219, -63.285919189453125, -57.72389602661133, -52.161869049072266, -46.5998420715332, -41.037818908691406, -35.475791931152344, -29.91376495361328, -24.35173797607422, -18.78971290588379, -13.22768783569336, -7.665660858154297, -2.1036338806152344, 3.4583892822265625, 9.020416259765625, 14.582443237304688]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 9.0, 7.0, 14.0, 10.0, 8.0, 12.0, 18.0, 18.0, 24.0, 28.0, 30.0, 20.0, 24.0, 44.0, 34.0, 29.0, 43.0, 35.0, 37.0, 47.0, 32.0, 43.0, 46.0, 52.0, 44.0, 48.0, 35.0, 33.0, 27.0, 34.0, 26.0, 13.0, 10.0, 17.0, 9.0, 9.0, 4.0, 8.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.63573455810547, -104.0561294555664, -100.47652435302734, -96.89691925048828, -93.31731414794922, -89.73770904541016, -86.15809631347656, -82.5784912109375, -78.99888610839844, -75.41928100585938, -71.83967590332031, -68.26007080078125, -64.68046569824219, -61.100860595703125, -57.5212516784668, -53.941646575927734, -50.36204528808594, -46.782440185546875, -43.20283508300781, -39.62322998046875, -36.04362487792969, -32.464019775390625, -28.884410858154297, -25.304805755615234, -21.725200653076172, -18.14559555053711, -14.56598949432373, -10.986383438110352, -7.406778335571289, -3.8271732330322266, -0.24756622314453125, 3.3320388793945312, 6.911643981933594, 10.491249084472656, 14.070855140686035, 17.650461196899414, 21.230066299438477, 24.80967140197754, 28.389278411865234, 31.968883514404297, 35.54848861694336, 39.12809371948242, 42.707698822021484, 46.28730773925781, 49.866912841796875, 53.44651794433594, 57.026123046875, 60.60572814941406, 64.18533325195312, 67.76493835449219, 71.34454345703125, 74.92414855957031, 78.50375366210938, 82.08335876464844, 85.6629638671875, 89.24256896972656, 92.82217407226562, 96.40177917480469, 99.98138427734375, 103.56098937988281, 107.14059448242188, 110.72019958496094, 114.2998046875, 117.87940979003906, 121.45902252197266]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 12.0, 16.0, 11.0, 20.0, 24.0, 17.0, 21.0, 30.0, 47.0, 33.0, 45.0, 52.0, 47.0, 60.0, 60.0, 59.0, 60.0, 42.0, 38.0, 39.0, 50.0, 29.0, 33.0, 28.0, 24.0, 24.0, 21.0, 8.0, 15.0, 6.0, 7.0, 5.0, 4.0, 3.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.546875, -13.136962890625, -12.72705078125, -12.317138671875, -11.9072265625, -11.497314453125, -11.08740234375, -10.677490234375, -10.267578125, -9.857666015625, -9.44775390625, -9.037841796875, -8.6279296875, -8.218017578125, -7.80810546875, -7.398193359375, -6.98828125, -6.578369140625, -6.16845703125, -5.758544921875, -5.3486328125, -4.938720703125, -4.52880859375, -4.118896484375, -3.708984375, -3.299072265625, -2.88916015625, -2.479248046875, -2.0693359375, -1.659423828125, -1.24951171875, -0.839599609375, -0.4296875, -0.019775390625, 0.39013671875, 0.800048828125, 1.2099609375, 1.619873046875, 2.02978515625, 2.439697265625, 2.849609375, 3.259521484375, 3.66943359375, 4.079345703125, 4.4892578125, 4.899169921875, 5.30908203125, 5.718994140625, 6.12890625, 6.538818359375, 6.94873046875, 7.358642578125, 7.7685546875, 8.178466796875, 8.58837890625, 8.998291015625, 9.408203125, 9.818115234375, 10.22802734375, 10.637939453125, 11.0478515625, 11.457763671875, 11.86767578125, 12.277587890625, 12.6875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 9.0, 11.0, 10.0, 24.0, 18.0, 35.0, 36.0, 51.0, 65.0, 160.0, 292.0, 610.0, 1504.0, 4049.0, 16847.0, 1737680.0, 2402816.0, 22585.0, 4399.0, 1632.0, 680.0, 327.0, 163.0, 85.0, 50.0, 41.0, 29.0, 18.0, 18.0, 7.0, 9.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.3125, -50.72900390625, -49.1455078125, -47.56201171875, -45.978515625, -44.39501953125, -42.8115234375, -41.22802734375, -39.64453125, -38.06103515625, -36.4775390625, -34.89404296875, -33.310546875, -31.72705078125, -30.1435546875, -28.56005859375, -26.9765625, -25.39306640625, -23.8095703125, -22.22607421875, -20.642578125, -19.05908203125, -17.4755859375, -15.89208984375, -14.30859375, -12.72509765625, -11.1416015625, -9.55810546875, -7.974609375, -6.39111328125, -4.8076171875, -3.22412109375, -1.640625, -0.05712890625, 1.5263671875, 3.10986328125, 4.693359375, 6.27685546875, 7.8603515625, 9.44384765625, 11.02734375, 12.61083984375, 14.1943359375, 15.77783203125, 17.361328125, 18.94482421875, 20.5283203125, 22.11181640625, 23.6953125, 25.27880859375, 26.8623046875, 28.44580078125, 30.029296875, 31.61279296875, 33.1962890625, 34.77978515625, 36.36328125, 37.94677734375, 39.5302734375, 41.11376953125, 42.697265625, 44.28076171875, 45.8642578125, 47.44775390625, 49.03125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 5.0, 2.0, 5.0, 10.0, 7.0, 10.0, 17.0, 28.0, 32.0, 94.0, 167.0, 369.0, 744.0, 999.0, 800.0, 367.0, 193.0, 79.0, 40.0, 22.0, 22.0, 11.0, 6.0, 8.0, 8.0, 6.0, 3.0, 0.0, 9.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.6875, -37.49658203125, -36.3056640625, -35.11474609375, -33.923828125, -32.73291015625, -31.5419921875, -30.35107421875, -29.16015625, -27.96923828125, -26.7783203125, -25.58740234375, -24.396484375, -23.20556640625, -22.0146484375, -20.82373046875, -19.6328125, -18.44189453125, -17.2509765625, -16.06005859375, -14.869140625, -13.67822265625, -12.4873046875, -11.29638671875, -10.10546875, -8.91455078125, -7.7236328125, -6.53271484375, -5.341796875, -4.15087890625, -2.9599609375, -1.76904296875, -0.578125, 0.61279296875, 1.8037109375, 2.99462890625, 4.185546875, 5.37646484375, 6.5673828125, 7.75830078125, 8.94921875, 10.14013671875, 11.3310546875, 12.52197265625, 13.712890625, 14.90380859375, 16.0947265625, 17.28564453125, 18.4765625, 19.66748046875, 20.8583984375, 22.04931640625, 23.240234375, 24.43115234375, 25.6220703125, 26.81298828125, 28.00390625, 29.19482421875, 30.3857421875, 31.57666015625, 32.767578125, 33.95849609375, 35.1494140625, 36.34033203125, 37.53125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 12.0, 6.0, 28.0, 36.0, 64.0, 131.0, 226.0, 447.0, 789.0, 1868.0, 3935.0, 9435.0, 30299.0, 533053.0, 3516189.0, 72304.0, 14803.0, 5760.0, 2477.0, 1180.0, 578.0, 304.0, 149.0, 92.0, 46.0, 22.0, 17.0, 8.0, 7.0, 3.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.53125, -54.59716796875, -52.6630859375, -50.72900390625, -48.794921875, -46.86083984375, -44.9267578125, -42.99267578125, -41.05859375, -39.12451171875, -37.1904296875, -35.25634765625, -33.322265625, -31.38818359375, -29.4541015625, -27.52001953125, -25.5859375, -23.65185546875, -21.7177734375, -19.78369140625, -17.849609375, -15.91552734375, -13.9814453125, -12.04736328125, -10.11328125, -8.17919921875, -6.2451171875, -4.31103515625, -2.376953125, -0.44287109375, 1.4912109375, 3.42529296875, 5.359375, 7.29345703125, 9.2275390625, 11.16162109375, 13.095703125, 15.02978515625, 16.9638671875, 18.89794921875, 20.83203125, 22.76611328125, 24.7001953125, 26.63427734375, 28.568359375, 30.50244140625, 32.4365234375, 34.37060546875, 36.3046875, 38.23876953125, 40.1728515625, 42.10693359375, 44.041015625, 45.97509765625, 47.9091796875, 49.84326171875, 51.77734375, 53.71142578125, 55.6455078125, 57.57958984375, 59.513671875, 61.44775390625, 63.3818359375, 65.31591796875, 67.25]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 10.0, 9.0, 18.0, 37.0, 58.0, 100.0, 214.0, 259.0, 137.0, 81.0, 35.0, 23.0, 11.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-233.505859375, -227.22605895996094, -220.94625854492188, -214.6664581298828, -208.38665771484375, -202.10684204101562, -195.82704162597656, -189.5472412109375, -183.26744079589844, -176.98764038085938, -170.7078399658203, -164.42803955078125, -158.14822387695312, -151.86842346191406, -145.588623046875, -139.30882263183594, -133.02902221679688, -126.74922180175781, -120.46942138671875, -114.18961334228516, -107.9098129272461, -101.63001251220703, -95.35020446777344, -89.07040405273438, -82.79060363769531, -76.51080322265625, -70.23100280761719, -63.951194763183594, -57.67139434814453, -51.39159393310547, -45.11178970336914, -38.83198547363281, -32.55220031738281, -26.272397994995117, -19.992595672607422, -13.712793350219727, -7.432991027832031, -1.153188705444336, 5.126613616943359, 11.406417846679688, 17.68621826171875, 23.966020584106445, 30.24582290649414, 36.52562713623047, 42.80542755126953, 49.085227966308594, 55.36503219604492, 61.64483642578125, 67.92463684082031, 74.20443725585938, 80.48423767089844, 86.76404571533203, 93.0438461303711, 99.32364654541016, 105.60345458984375, 111.88325500488281, 118.16305541992188, 124.44285583496094, 130.72265625, 137.00245666503906, 143.28225708007812, 149.56207275390625, 155.8418731689453, 162.12167358398438, 168.40147399902344]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 3.0, 5.0, 7.0, 12.0, 11.0, 9.0, 18.0, 17.0, 14.0, 19.0, 17.0, 19.0, 31.0, 23.0, 35.0, 33.0, 52.0, 33.0, 46.0, 58.0, 53.0, 39.0, 29.0, 35.0, 54.0, 38.0, 46.0, 23.0, 31.0, 15.0, 25.0, 26.0, 29.0, 22.0, 17.0, 18.0, 9.0, 12.0, 5.0, 5.0, 2.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.48394775390625, -73.78535461425781, -71.08676147460938, -68.3881607055664, -65.68956756591797, -62.99097442626953, -60.292381286621094, -57.59378433227539, -54.89518737792969, -52.19659423828125, -49.49799728393555, -46.79940414428711, -44.100807189941406, -41.40221405029297, -38.70362091064453, -36.00502395629883, -33.30643081665039, -30.60783576965332, -27.90924072265625, -25.210647583007812, -22.51205062866211, -19.813457489013672, -17.1148624420166, -14.416267395019531, -11.717672348022461, -9.01907730102539, -6.3204827308654785, -3.6218881607055664, -0.9232931137084961, 1.7753019332885742, 4.473896026611328, 7.172491073608398, 9.871086120605469, 12.569681167602539, 15.26827621459961, 17.966869354248047, 20.66546630859375, 23.364059448242188, 26.062654495239258, 28.761249542236328, 31.4598445892334, 34.15843963623047, 36.857032775878906, 39.55562973022461, 42.25422286987305, 44.95281982421875, 47.65141296386719, 50.350006103515625, 53.04860305786133, 55.747196197509766, 58.44579315185547, 61.144386291503906, 63.84298324584961, 66.54158020019531, 69.24017333984375, 71.93876647949219, 74.63735961914062, 77.33595275878906, 80.0345458984375, 82.73314666748047, 85.4317398071289, 88.13033294677734, 90.82892608642578, 93.52752685546875, 96.22611999511719]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 8.0, 9.0, 8.0, 8.0, 15.0, 21.0, 15.0, 12.0, 21.0, 31.0, 27.0, 39.0, 41.0, 49.0, 38.0, 41.0, 42.0, 52.0, 55.0, 65.0, 44.0, 36.0, 49.0, 36.0, 28.0, 25.0, 22.0, 25.0, 27.0, 21.0, 18.0, 18.0, 12.0, 10.0, 10.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.2265625, -12.83935546875, -12.4521484375, -12.06494140625, -11.677734375, -11.29052734375, -10.9033203125, -10.51611328125, -10.12890625, -9.74169921875, -9.3544921875, -8.96728515625, -8.580078125, -8.19287109375, -7.8056640625, -7.41845703125, -7.03125, -6.64404296875, -6.2568359375, -5.86962890625, -5.482421875, -5.09521484375, -4.7080078125, -4.32080078125, -3.93359375, -3.54638671875, -3.1591796875, -2.77197265625, -2.384765625, -1.99755859375, -1.6103515625, -1.22314453125, -0.8359375, -0.44873046875, -0.0615234375, 0.32568359375, 0.712890625, 1.10009765625, 1.4873046875, 1.87451171875, 2.26171875, 2.64892578125, 3.0361328125, 3.42333984375, 3.810546875, 4.19775390625, 4.5849609375, 4.97216796875, 5.359375, 5.74658203125, 6.1337890625, 6.52099609375, 6.908203125, 7.29541015625, 7.6826171875, 8.06982421875, 8.45703125, 8.84423828125, 9.2314453125, 9.61865234375, 10.005859375, 10.39306640625, 10.7802734375, 11.16748046875, 11.5546875]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 6.0, 5.0, 3.0, 7.0, 10.0, 23.0, 23.0, 29.0, 48.0, 74.0, 104.0, 157.0, 227.0, 299.0, 463.0, 712.0, 1079.0, 1648.0, 2438.0, 3738.0, 6039.0, 9404.0, 14980.0, 24935.0, 41653.0, 72753.0, 138169.0, 266100.0, 212307.0, 105339.0, 57183.0, 33203.0, 20553.0, 12685.0, 7823.0, 4968.0, 3241.0, 2028.0, 1338.0, 889.0, 604.0, 408.0, 262.0, 177.0, 123.0, 101.0, 64.0, 55.0, 29.0, 18.0, 17.0, 11.0, 5.0, 3.0, 7.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.076171875, -1.042327880859375, -1.00848388671875, -0.974639892578125, -0.9407958984375, -0.906951904296875, -0.87310791015625, -0.839263916015625, -0.805419921875, -0.771575927734375, -0.73773193359375, -0.703887939453125, -0.6700439453125, -0.636199951171875, -0.60235595703125, -0.568511962890625, -0.53466796875, -0.500823974609375, -0.46697998046875, -0.433135986328125, -0.3992919921875, -0.365447998046875, -0.33160400390625, -0.297760009765625, -0.263916015625, -0.230072021484375, -0.19622802734375, -0.162384033203125, -0.1285400390625, -0.094696044921875, -0.06085205078125, -0.027008056640625, 0.0068359375, 0.040679931640625, 0.07452392578125, 0.108367919921875, 0.1422119140625, 0.176055908203125, 0.20989990234375, 0.243743896484375, 0.277587890625, 0.311431884765625, 0.34527587890625, 0.379119873046875, 0.4129638671875, 0.446807861328125, 0.48065185546875, 0.514495849609375, 0.54833984375, 0.582183837890625, 0.61602783203125, 0.649871826171875, 0.6837158203125, 0.717559814453125, 0.75140380859375, 0.785247802734375, 0.819091796875, 0.852935791015625, 0.88677978515625, 0.920623779296875, 0.9544677734375, 0.988311767578125, 1.02215576171875, 1.055999755859375, 1.08984375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 7.0, 8.0, 7.0, 6.0, 12.0, 16.0, 13.0, 24.0, 20.0, 25.0, 26.0, 42.0, 22.0, 40.0, 39.0, 35.0, 35.0, 41.0, 57.0, 1068.0, 45.0, 47.0, 35.0, 33.0, 41.0, 38.0, 29.0, 37.0, 24.0, 27.0, 12.0, 26.0, 21.0, 15.0, 11.0, 11.0, 12.0, 5.0, 3.0, 2.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.3984375, -7.1605224609375, -6.922607421875, -6.6846923828125, -6.44677734375, -6.2088623046875, -5.970947265625, -5.7330322265625, -5.4951171875, -5.2572021484375, -5.019287109375, -4.7813720703125, -4.54345703125, -4.3055419921875, -4.067626953125, -3.8297119140625, -3.591796875, -3.3538818359375, -3.115966796875, -2.8780517578125, -2.64013671875, -2.4022216796875, -2.164306640625, -1.9263916015625, -1.6884765625, -1.4505615234375, -1.212646484375, -0.9747314453125, -0.73681640625, -0.4989013671875, -0.260986328125, -0.0230712890625, 0.21484375, 0.4527587890625, 0.690673828125, 0.9285888671875, 1.16650390625, 1.4044189453125, 1.642333984375, 1.8802490234375, 2.1181640625, 2.3560791015625, 2.593994140625, 2.8319091796875, 3.06982421875, 3.3077392578125, 3.545654296875, 3.7835693359375, 4.021484375, 4.2593994140625, 4.497314453125, 4.7352294921875, 4.97314453125, 5.2110595703125, 5.448974609375, 5.6868896484375, 5.9248046875, 6.1627197265625, 6.400634765625, 6.6385498046875, 6.87646484375, 7.1143798828125, 7.352294921875, 7.5902099609375, 7.828125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 6.0, 13.0, 13.0, 23.0, 38.0, 54.0, 92.0, 158.0, 191.0, 356.0, 641.0, 1091.0, 2122.0, 3865.0, 7865.0, 15478.0, 31491.0, 67376.0, 153841.0, 1406126.0, 228004.0, 93244.0, 42775.0, 20632.0, 10208.0, 5422.0, 2659.0, 1390.0, 783.0, 449.0, 253.0, 183.0, 98.0, 66.0, 42.0, 29.0, 18.0, 13.0, 6.0, 4.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.623046875, -1.5762786865234375, -1.529510498046875, -1.4827423095703125, -1.43597412109375, -1.3892059326171875, -1.342437744140625, -1.2956695556640625, -1.2489013671875, -1.2021331787109375, -1.155364990234375, -1.1085968017578125, -1.06182861328125, -1.0150604248046875, -0.968292236328125, -0.9215240478515625, -0.874755859375, -0.8279876708984375, -0.781219482421875, -0.7344512939453125, -0.68768310546875, -0.6409149169921875, -0.594146728515625, -0.5473785400390625, -0.5006103515625, -0.4538421630859375, -0.407073974609375, -0.3603057861328125, -0.31353759765625, -0.2667694091796875, -0.220001220703125, -0.1732330322265625, -0.12646484375, -0.0796966552734375, -0.032928466796875, 0.0138397216796875, 0.06060791015625, 0.1073760986328125, 0.154144287109375, 0.2009124755859375, 0.2476806640625, 0.2944488525390625, 0.341217041015625, 0.3879852294921875, 0.43475341796875, 0.4815216064453125, 0.528289794921875, 0.5750579833984375, 0.621826171875, 0.6685943603515625, 0.715362548828125, 0.7621307373046875, 0.80889892578125, 0.8556671142578125, 0.902435302734375, 0.9492034912109375, 0.9959716796875, 1.0427398681640625, 1.089508056640625, 1.1362762451171875, 1.18304443359375, 1.2298126220703125, 1.276580810546875, 1.3233489990234375, 1.3701171875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 2.0, 8.0, 5.0, 6.0, 7.0, 12.0, 16.0, 9.0, 15.0, 18.0, 21.0, 37.0, 34.0, 42.0, 34.0, 50.0, 49.0, 47.0, 49.0, 48.0, 54.0, 43.0, 47.0, 42.0, 48.0, 30.0, 38.0, 25.0, 28.0, 18.0, 21.0, 17.0, 18.0, 11.0, 6.0, 10.0, 11.0, 8.0, 5.0, 2.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0023822784423828125, -0.0023102760314941406, -0.0022382736206054688, -0.002166271209716797, -0.002094268798828125, -0.002022266387939453, -0.0019502639770507812, -0.0018782615661621094, -0.0018062591552734375, -0.0017342567443847656, -0.0016622543334960938, -0.0015902519226074219, -0.00151824951171875, -0.0014462471008300781, -0.0013742446899414062, -0.0013022422790527344, -0.0012302398681640625, -0.0011582374572753906, -0.0010862350463867188, -0.0010142326354980469, -0.000942230224609375, -0.0008702278137207031, -0.0007982254028320312, -0.0007262229919433594, -0.0006542205810546875, -0.0005822181701660156, -0.0005102157592773438, -0.0004382133483886719, -0.0003662109375, -0.0002942085266113281, -0.00022220611572265625, -0.00015020370483398438, -7.82012939453125e-05, -6.198883056640625e-06, 6.580352783203125e-05, 0.00013780593872070312, 0.000209808349609375, 0.0002818107604980469, 0.00035381317138671875, 0.0004258155822753906, 0.0004978179931640625, 0.0005698204040527344, 0.0006418228149414062, 0.0007138252258300781, 0.00078582763671875, 0.0008578300476074219, 0.0009298324584960938, 0.0010018348693847656, 0.0010738372802734375, 0.0011458396911621094, 0.0012178421020507812, 0.0012898445129394531, 0.001361846923828125, 0.0014338493347167969, 0.0015058517456054688, 0.0015778541564941406, 0.0016498565673828125, 0.0017218589782714844, 0.0017938613891601562, 0.0018658638000488281, 0.0019378662109375, 0.002009868621826172, 0.0020818710327148438, 0.0021538734436035156, 0.0022258758544921875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 3.0, 9.0, 14.0, 14.0, 15.0, 21.0, 26.0, 40.0, 51.0, 65.0, 88.0, 125.0, 166.0, 229.0, 381.0, 1073.0, 35712.0, 984116.0, 24183.0, 965.0, 392.0, 226.0, 171.0, 140.0, 85.0, 69.0, 39.0, 40.0, 31.0, 13.0, 13.0, 8.0, 4.0, 3.0, 3.0, 5.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049346923828125, -0.04782676696777344, -0.046306610107421875, -0.04478645324707031, -0.04326629638671875, -0.04174613952636719, -0.040225982666015625, -0.03870582580566406, -0.0371856689453125, -0.03566551208496094, -0.034145355224609375, -0.03262519836425781, -0.03110504150390625, -0.029584884643554688, -0.028064727783203125, -0.026544570922851562, -0.0250244140625, -0.023504257202148438, -0.021984100341796875, -0.020463943481445312, -0.01894378662109375, -0.017423629760742188, -0.015903472900390625, -0.014383316040039062, -0.0128631591796875, -0.011343002319335938, -0.009822845458984375, -0.008302688598632812, -0.00678253173828125, -0.0052623748779296875, -0.003742218017578125, -0.0022220611572265625, -0.000701904296875, 0.0008182525634765625, 0.002338409423828125, 0.0038585662841796875, 0.00537872314453125, 0.0068988800048828125, 0.008419036865234375, 0.009939193725585938, 0.0114593505859375, 0.012979507446289062, 0.014499664306640625, 0.016019821166992188, 0.01753997802734375, 0.019060134887695312, 0.020580291748046875, 0.022100448608398438, 0.02362060546875, 0.025140762329101562, 0.026660919189453125, 0.028181076049804688, 0.02970123291015625, 0.031221389770507812, 0.032741546630859375, 0.03426170349121094, 0.0357818603515625, 0.03730201721191406, 0.038822174072265625, 0.04034233093261719, 0.04186248779296875, 0.04338264465332031, 0.044902801513671875, 0.04642295837402344, 0.047943115234375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 10.0, 27.0, 131.0, 428.0, 322.0, 75.0, 19.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003859537187963724, -0.0036300986539572477, -0.0034006601199507713, -0.0031712218187749386, -0.002941783284768462, -0.0027123447507619858, -0.002482906449586153, -0.0022534679155796766, -0.0020240293815732002, -0.0017945908475667238, -0.0015651524299755692, -0.0013357140123844147, -0.0011062754783779383, -0.0008768369443714619, -0.0006473985267803073, -0.0004179601091891527, -0.00018852157518267632, 4.0916900616139174e-05, 0.00027035537641495466, 0.0004997938522137702, 0.0007292323280125856, 0.000958670862019062, 0.0011881092796102166, 0.0014175476972013712, 0.0016469862312078476, 0.001876424765214324, 0.0021058632992208004, 0.002335301600396633, 0.0025647401344031096, 0.002794178668409586, 0.0030236169695854187, 0.003253055503591895, 0.003482493571937084, 0.0037119321059435606, 0.003941370639950037, 0.00417080894112587, 0.00440024770796299, 0.0046296860091388226, 0.004859124310314655, 0.005088563077151775, 0.005318001378327608, 0.005547439679503441, 0.005776878446340561, 0.006006316747516394, 0.006235755048692226, 0.0064651938155293465, 0.006694632116705179, 0.006924070417881012, 0.007153509184718132, 0.007382947485893965, 0.007612386252731085, 0.007841824553906918, 0.008071263320744038, 0.008300701156258583, 0.008530139923095703, 0.008759578689932823, 0.008989017456769943, 0.009218456223607063, 0.009447894059121609, 0.009677332825958729, 0.009906771592795849, 0.010136209428310394, 0.010365648195147514, 0.010595086961984634, 0.01082452479749918]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 10.0, 13.0, 12.0, 17.0, 14.0, 26.0, 14.0, 31.0, 21.0, 24.0, 34.0, 34.0, 43.0, 43.0, 48.0, 53.0, 38.0, 47.0, 48.0, 44.0, 42.0, 42.0, 44.0, 41.0, 34.0, 25.0, 32.0, 25.0, 20.0, 22.0, 17.0, 9.0, 9.0, 8.0, 8.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014436841011047363, -0.001396162435412407, -0.0013486407697200775, -0.001301119104027748, -0.0012535974383354187, -0.0012060757726430893, -0.0011585541069507599, -0.0011110324412584305, -0.001063510775566101, -0.0010159891098737717, -0.0009684674441814423, -0.0009209457784891129, -0.0008734241127967834, -0.000825902447104454, -0.0007783807814121246, -0.0007308591157197952, -0.0006833374500274658, -0.0006358157843351364, -0.000588294118642807, -0.0005407724529504776, -0.0004932507872581482, -0.0004457291215658188, -0.0003982074558734894, -0.00035068579018116, -0.00030316412448883057, -0.00025564245879650116, -0.00020812079310417175, -0.00016059912741184235, -0.00011307746171951294, -6.555579602718353e-05, -1.8034130334854126e-05, 2.948753535747528e-05, 7.700920104980469e-05, 0.0001245308667421341, 0.0001720525324344635, 0.0002195741981267929, 0.0002670958638191223, 0.0003146175295114517, 0.00036213919520378113, 0.00040966086089611053, 0.00045718252658843994, 0.0005047041922807693, 0.0005522258579730988, 0.0005997475236654282, 0.0006472691893577576, 0.000694790855050087, 0.0007423125207424164, 0.0007898341864347458, 0.0008373558521270752, 0.0008848775178194046, 0.000932399183511734, 0.0009799208492040634, 0.0010274425148963928, 0.0010749641805887222, 0.0011224858462810516, 0.001170007511973381, 0.0012175291776657104, 0.0012650508433580399, 0.0013125725090503693, 0.0013600941747426987, 0.001407615840435028, 0.0014551375061273575, 0.0015026591718196869, 0.0015501808375120163, 0.0015977025032043457]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 8.0, 9.0, 8.0, 8.0, 15.0, 21.0, 15.0, 12.0, 21.0, 31.0, 27.0, 39.0, 41.0, 49.0, 38.0, 41.0, 42.0, 52.0, 55.0, 65.0, 44.0, 36.0, 48.0, 37.0, 28.0, 25.0, 22.0, 25.0, 27.0, 21.0, 18.0, 18.0, 12.0, 10.0, 10.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.2265625, -12.83935546875, -12.4521484375, -12.06494140625, -11.677734375, -11.29052734375, -10.9033203125, -10.51611328125, -10.12890625, -9.74169921875, -9.3544921875, -8.96728515625, -8.580078125, -8.19287109375, -7.8056640625, -7.41845703125, -7.03125, -6.64404296875, -6.2568359375, -5.86962890625, -5.482421875, -5.09521484375, -4.7080078125, -4.32080078125, -3.93359375, -3.54638671875, -3.1591796875, -2.77197265625, -2.384765625, -1.99755859375, -1.6103515625, -1.22314453125, -0.8359375, -0.44873046875, -0.0615234375, 0.32568359375, 0.712890625, 1.10009765625, 1.4873046875, 1.87451171875, 2.26171875, 2.64892578125, 3.0361328125, 3.42333984375, 3.810546875, 4.19775390625, 4.5849609375, 4.97216796875, 5.359375, 5.74658203125, 6.1337890625, 6.52099609375, 6.908203125, 7.29541015625, 7.6826171875, 8.06982421875, 8.45703125, 8.84423828125, 9.2314453125, 9.61865234375, 10.005859375, 10.39306640625, 10.7802734375, 11.16748046875, 11.5546875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 5.0, 3.0, 5.0, 9.0, 5.0, 13.0, 8.0, 23.0, 25.0, 35.0, 65.0, 62.0, 77.0, 134.0, 162.0, 224.0, 303.0, 423.0, 561.0, 922.0, 1361.0, 2199.0, 4013.0, 8759.0, 25254.0, 121462.0, 657565.0, 171067.0, 31784.0, 10345.0, 4549.0, 2362.0, 1518.0, 904.0, 629.0, 448.0, 331.0, 233.0, 201.0, 141.0, 82.0, 86.0, 48.0, 41.0, 31.0, 20.0, 14.0, 9.0, 6.0, 10.0, 3.0, 7.0, 6.0, 2.0, 2.0, 4.0], "bins": [-12.8515625, -12.47998046875, -12.1083984375, -11.73681640625, -11.365234375, -10.99365234375, -10.6220703125, -10.25048828125, -9.87890625, -9.50732421875, -9.1357421875, -8.76416015625, -8.392578125, -8.02099609375, -7.6494140625, -7.27783203125, -6.90625, -6.53466796875, -6.1630859375, -5.79150390625, -5.419921875, -5.04833984375, -4.6767578125, -4.30517578125, -3.93359375, -3.56201171875, -3.1904296875, -2.81884765625, -2.447265625, -2.07568359375, -1.7041015625, -1.33251953125, -0.9609375, -0.58935546875, -0.2177734375, 0.15380859375, 0.525390625, 0.89697265625, 1.2685546875, 1.64013671875, 2.01171875, 2.38330078125, 2.7548828125, 3.12646484375, 3.498046875, 3.86962890625, 4.2412109375, 4.61279296875, 4.984375, 5.35595703125, 5.7275390625, 6.09912109375, 6.470703125, 6.84228515625, 7.2138671875, 7.58544921875, 7.95703125, 8.32861328125, 8.7001953125, 9.07177734375, 9.443359375, 9.81494140625, 10.1865234375, 10.55810546875, 10.9296875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 8.0, 7.0, 5.0, 5.0, 12.0, 12.0, 19.0, 20.0, 23.0, 18.0, 37.0, 30.0, 32.0, 42.0, 40.0, 45.0, 56.0, 68.0, 332.0, 1717.0, 88.0, 61.0, 47.0, 36.0, 58.0, 27.0, 34.0, 33.0, 24.0, 24.0, 21.0, 18.0, 9.0, 9.0, 8.0, 9.0, 3.0, 6.0, 2.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-46.15625, -44.84375, -43.53125, -42.21875, -40.90625, -39.59375, -38.28125, -36.96875, -35.65625, -34.34375, -33.03125, -31.71875, -30.40625, -29.09375, -27.78125, -26.46875, -25.15625, -23.84375, -22.53125, -21.21875, -19.90625, -18.59375, -17.28125, -15.96875, -14.65625, -13.34375, -12.03125, -10.71875, -9.40625, -8.09375, -6.78125, -5.46875, -4.15625, -2.84375, -1.53125, -0.21875, 1.09375, 2.40625, 3.71875, 5.03125, 6.34375, 7.65625, 8.96875, 10.28125, 11.59375, 12.90625, 14.21875, 15.53125, 16.84375, 18.15625, 19.46875, 20.78125, 22.09375, 23.40625, 24.71875, 26.03125, 27.34375, 28.65625, 29.96875, 31.28125, 32.59375, 33.90625, 35.21875, 36.53125, 37.84375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 6.0, 7.0, 13.0, 12.0, 13.0, 29.0, 42.0, 55.0, 85.0, 94.0, 208.0, 460.0, 1946.0, 25968.0, 3107951.0, 6907.0, 1081.0, 342.0, 154.0, 88.0, 70.0, 42.0, 33.0, 22.0, 23.0, 8.0, 7.0, 13.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-95.75, -92.591796875, -89.43359375, -86.275390625, -83.1171875, -79.958984375, -76.80078125, -73.642578125, -70.484375, -67.326171875, -64.16796875, -61.009765625, -57.8515625, -54.693359375, -51.53515625, -48.376953125, -45.21875, -42.060546875, -38.90234375, -35.744140625, -32.5859375, -29.427734375, -26.26953125, -23.111328125, -19.953125, -16.794921875, -13.63671875, -10.478515625, -7.3203125, -4.162109375, -1.00390625, 2.154296875, 5.3125, 8.470703125, 11.62890625, 14.787109375, 17.9453125, 21.103515625, 24.26171875, 27.419921875, 30.578125, 33.736328125, 36.89453125, 40.052734375, 43.2109375, 46.369140625, 49.52734375, 52.685546875, 55.84375, 59.001953125, 62.16015625, 65.318359375, 68.4765625, 71.634765625, 74.79296875, 77.951171875, 81.109375, 84.267578125, 87.42578125, 90.583984375, 93.7421875, 96.900390625, 100.05859375, 103.216796875, 106.375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 377.0, 633.0, 7.0], "bins": [-801.2980346679688, -788.3875122070312, -775.4769897460938, -762.5664672851562, -749.6559448242188, -736.745361328125, -723.8348388671875, -710.92431640625, -698.0137939453125, -685.103271484375, -672.1927490234375, -659.2822265625, -646.3717041015625, -633.461181640625, -620.5505981445312, -607.6400756835938, -594.7295532226562, -581.8190307617188, -568.9085083007812, -555.9979858398438, -543.0874633789062, -530.1768798828125, -517.266357421875, -504.3558349609375, -491.4453430175781, -478.5348205566406, -465.6242980957031, -452.7137451171875, -439.80322265625, -426.8927001953125, -413.982177734375, -401.0716552734375, -388.1611022949219, -375.2505798339844, -362.3400573730469, -349.42950439453125, -336.51898193359375, -323.60845947265625, -310.69793701171875, -297.78741455078125, -284.8768615722656, -271.9663391113281, -259.0558166503906, -246.14527893066406, -233.2347412109375, -220.32421875, -207.4136962890625, -194.50315856933594, -181.59262084960938, -168.68209838867188, -155.7715606689453, -142.8610382080078, -129.95050048828125, -117.03997802734375, -104.12944793701172, -91.21891784667969, -78.30838775634766, -65.39785766601562, -52.487327575683594, -39.57680130004883, -26.666271209716797, -13.755744934082031, -0.84521484375, 12.065315246582031, 24.97584342956543]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 5.0, 1.0, 9.0, 9.0, 9.0, 10.0, 12.0, 15.0, 15.0, 34.0, 22.0, 33.0, 29.0, 45.0, 43.0, 50.0, 38.0, 44.0, 37.0, 45.0, 31.0, 36.0, 51.0, 40.0, 40.0, 33.0, 40.0, 35.0, 27.0, 24.0, 22.0, 21.0, 19.0, 18.0, 16.0, 12.0, 13.0, 10.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0], "bins": [-146.93112182617188, -143.2152557373047, -139.4993896484375, -135.7835235595703, -132.06765747070312, -128.35179138183594, -124.63593292236328, -120.9200668334961, -117.2042007446289, -113.48833465576172, -109.77246856689453, -106.05661010742188, -102.34074401855469, -98.6248779296875, -94.90901184082031, -91.19314575195312, -87.47727966308594, -83.76141357421875, -80.04554748535156, -76.32968139648438, -72.61382293701172, -68.89795684814453, -65.18209075927734, -61.466224670410156, -57.7503662109375, -54.03450012207031, -50.31863784790039, -46.6027717590332, -42.886905670166016, -39.171043395996094, -35.455177307128906, -31.73931121826172, -28.02344512939453, -24.307580947875977, -20.59171485900879, -16.875850677490234, -13.159985542297363, -9.444120407104492, -5.7282562255859375, -2.01239013671875, 1.7034740447998047, 5.419339179992676, 9.135204315185547, 12.851068496704102, 16.566932678222656, 20.282798767089844, 23.9986629486084, 27.714529037475586, 31.43039321899414, 35.14625930786133, 38.86212158203125, 42.57798767089844, 46.293853759765625, 50.00971984863281, 53.725582122802734, 57.44144821166992, 61.157310485839844, 64.87317657470703, 68.58904266357422, 72.30490112304688, 76.02076721191406, 79.73663330078125, 83.45249938964844, 87.16836547851562, 90.88423156738281]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 10.0, 8.0, 5.0, 7.0, 11.0, 13.0, 15.0, 25.0, 18.0, 16.0, 31.0, 28.0, 28.0, 42.0, 42.0, 46.0, 45.0, 36.0, 47.0, 64.0, 60.0, 41.0, 38.0, 40.0, 45.0, 30.0, 21.0, 28.0, 22.0, 23.0, 21.0, 18.0, 17.0, 15.0, 17.0, 9.0, 6.0, 3.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-13.2578125, -12.8707275390625, -12.483642578125, -12.0965576171875, -11.70947265625, -11.3223876953125, -10.935302734375, -10.5482177734375, -10.1611328125, -9.7740478515625, -9.386962890625, -8.9998779296875, -8.61279296875, -8.2257080078125, -7.838623046875, -7.4515380859375, -7.064453125, -6.6773681640625, -6.290283203125, -5.9031982421875, -5.51611328125, -5.1290283203125, -4.741943359375, -4.3548583984375, -3.9677734375, -3.5806884765625, -3.193603515625, -2.8065185546875, -2.41943359375, -2.0323486328125, -1.645263671875, -1.2581787109375, -0.87109375, -0.4840087890625, -0.096923828125, 0.2901611328125, 0.67724609375, 1.0643310546875, 1.451416015625, 1.8385009765625, 2.2255859375, 2.6126708984375, 2.999755859375, 3.3868408203125, 3.77392578125, 4.1610107421875, 4.548095703125, 4.9351806640625, 5.322265625, 5.7093505859375, 6.096435546875, 6.4835205078125, 6.87060546875, 7.2576904296875, 7.644775390625, 8.0318603515625, 8.4189453125, 8.8060302734375, 9.193115234375, 9.5802001953125, 9.96728515625, 10.3543701171875, 10.741455078125, 11.1285400390625, 11.515625]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 3.0, 4.0, 4.0, 7.0, 8.0, 8.0, 17.0, 18.0, 31.0, 20.0, 40.0, 67.0, 92.0, 125.0, 148.0, 214.0, 302.0, 438.0, 665.0, 1016.0, 1739.0, 2898.0, 5346.0, 20555.0, 205216.0, 1901758.0, 1828025.0, 189460.0, 22562.0, 5585.0, 2973.0, 1721.0, 1047.0, 655.0, 482.0, 277.0, 220.0, 140.0, 102.0, 85.0, 42.0, 57.0, 31.0, 24.0, 10.0, 13.0, 10.0, 10.0, 6.0, 4.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-22.515625, -21.811767578125, -21.10791015625, -20.404052734375, -19.7001953125, -18.996337890625, -18.29248046875, -17.588623046875, -16.884765625, -16.180908203125, -15.47705078125, -14.773193359375, -14.0693359375, -13.365478515625, -12.66162109375, -11.957763671875, -11.25390625, -10.550048828125, -9.84619140625, -9.142333984375, -8.4384765625, -7.734619140625, -7.03076171875, -6.326904296875, -5.623046875, -4.919189453125, -4.21533203125, -3.511474609375, -2.8076171875, -2.103759765625, -1.39990234375, -0.696044921875, 0.0078125, 0.711669921875, 1.41552734375, 2.119384765625, 2.8232421875, 3.527099609375, 4.23095703125, 4.934814453125, 5.638671875, 6.342529296875, 7.04638671875, 7.750244140625, 8.4541015625, 9.157958984375, 9.86181640625, 10.565673828125, 11.26953125, 11.973388671875, 12.67724609375, 13.381103515625, 14.0849609375, 14.788818359375, 15.49267578125, 16.196533203125, 16.900390625, 17.604248046875, 18.30810546875, 19.011962890625, 19.7158203125, 20.419677734375, 21.12353515625, 21.827392578125, 22.53125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 9.0, 8.0, 7.0, 9.0, 14.0, 22.0, 20.0, 45.0, 62.0, 99.0, 206.0, 332.0, 638.0, 857.0, 708.0, 468.0, 244.0, 127.0, 54.0, 35.0, 20.0, 20.0, 17.0, 14.0, 7.0, 5.0, 4.0, 7.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.65625, -33.62744140625, -32.5986328125, -31.56982421875, -30.541015625, -29.51220703125, -28.4833984375, -27.45458984375, -26.42578125, -25.39697265625, -24.3681640625, -23.33935546875, -22.310546875, -21.28173828125, -20.2529296875, -19.22412109375, -18.1953125, -17.16650390625, -16.1376953125, -15.10888671875, -14.080078125, -13.05126953125, -12.0224609375, -10.99365234375, -9.96484375, -8.93603515625, -7.9072265625, -6.87841796875, -5.849609375, -4.82080078125, -3.7919921875, -2.76318359375, -1.734375, -0.70556640625, 0.3232421875, 1.35205078125, 2.380859375, 3.40966796875, 4.4384765625, 5.46728515625, 6.49609375, 7.52490234375, 8.5537109375, 9.58251953125, 10.611328125, 11.64013671875, 12.6689453125, 13.69775390625, 14.7265625, 15.75537109375, 16.7841796875, 17.81298828125, 18.841796875, 19.87060546875, 20.8994140625, 21.92822265625, 22.95703125, 23.98583984375, 25.0146484375, 26.04345703125, 27.072265625, 28.10107421875, 29.1298828125, 30.15869140625, 31.1875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 9.0, 10.0, 16.0, 32.0, 49.0, 64.0, 110.0, 164.0, 323.0, 551.0, 998.0, 1890.0, 3966.0, 8803.0, 22936.0, 106175.0, 3022321.0, 942620.0, 54309.0, 15915.0, 6605.0, 3032.0, 1470.0, 771.0, 469.0, 247.0, 161.0, 100.0, 59.0, 36.0, 26.0, 18.0, 9.0, 6.0, 7.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.9375, -36.5234375, -35.109375, -33.6953125, -32.28125, -30.8671875, -29.453125, -28.0390625, -26.625, -25.2109375, -23.796875, -22.3828125, -20.96875, -19.5546875, -18.140625, -16.7265625, -15.3125, -13.8984375, -12.484375, -11.0703125, -9.65625, -8.2421875, -6.828125, -5.4140625, -4.0, -2.5859375, -1.171875, 0.2421875, 1.65625, 3.0703125, 4.484375, 5.8984375, 7.3125, 8.7265625, 10.140625, 11.5546875, 12.96875, 14.3828125, 15.796875, 17.2109375, 18.625, 20.0390625, 21.453125, 22.8671875, 24.28125, 25.6953125, 27.109375, 28.5234375, 29.9375, 31.3515625, 32.765625, 34.1796875, 35.59375, 37.0078125, 38.421875, 39.8359375, 41.25, 42.6640625, 44.078125, 45.4921875, 46.90625, 48.3203125, 49.734375, 51.1484375, 52.5625]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 8.0, 52.0, 300.0, 556.0, 77.0, 18.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-518.7662963867188, -498.95367431640625, -479.1410217285156, -459.3283996582031, -439.5157470703125, -419.703125, -399.8905029296875, -380.077880859375, -360.2652282714844, -340.4526062011719, -320.63995361328125, -300.82733154296875, -281.01470947265625, -261.2020568847656, -241.38943481445312, -221.57679748535156, -201.76416015625, -181.95152282714844, -162.13888549804688, -142.32626342773438, -122.51362609863281, -102.70098876953125, -82.88835906982422, -63.07572937011719, -43.263092041015625, -23.450458526611328, -3.6378250122070312, 16.174808502197266, 35.98744201660156, 55.800079345703125, 75.61270904541016, 95.42533874511719, 115.238037109375, 135.05067443847656, 154.86331176757812, 174.67593383789062, 194.4885711669922, 214.30120849609375, 234.11383056640625, 253.9264678955078, 273.7391052246094, 293.5517272949219, 313.3643798828125, 333.177001953125, 352.9896240234375, 372.8022766113281, 392.6148986816406, 412.42755126953125, 432.24017333984375, 452.05279541015625, 471.8654479980469, 491.6780700683594, 511.49072265625, 531.3033447265625, 551.115966796875, 570.9285888671875, 590.7412109375, 610.5538330078125, 630.366455078125, 650.1791381835938, 669.9917602539062, 689.8043823242188, 709.6170043945312, 729.4296264648438, 749.2423095703125]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 9.0, 15.0, 7.0, 17.0, 13.0, 17.0, 15.0, 18.0, 29.0, 29.0, 26.0, 44.0, 28.0, 32.0, 41.0, 45.0, 39.0, 51.0, 41.0, 44.0, 41.0, 38.0, 31.0, 35.0, 32.0, 36.0, 31.0, 30.0, 28.0, 23.0, 18.0, 11.0, 17.0, 8.0, 12.0, 10.0, 12.0, 4.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-81.4825439453125, -78.90315246582031, -76.3237533569336, -73.7443618774414, -71.16497039794922, -68.5855712890625, -66.00617980957031, -63.426788330078125, -60.84739303588867, -58.26799774169922, -55.68860626220703, -53.10921096801758, -50.529815673828125, -47.95042419433594, -45.371028900146484, -42.79163360595703, -40.212242126464844, -37.63284683227539, -35.0534553527832, -32.47406005859375, -29.89466667175293, -27.31527328491211, -24.735877990722656, -22.156484603881836, -19.577091217041016, -16.997697830200195, -14.418303489685059, -11.838909149169922, -9.259515762329102, -6.680122375488281, -4.1007280349731445, -1.5213336944580078, 1.0580673217773438, 3.6374611854553223, 6.216855049133301, 8.796249389648438, 11.375642776489258, 13.955036163330078, 16.53443145751953, 19.11382484436035, 21.693218231201172, 24.272611618041992, 26.852005004882812, 29.431400299072266, 32.01079559326172, 34.590187072753906, 37.16958236694336, 39.74897766113281, 42.328369140625, 44.90776443481445, 47.48715591430664, 50.066551208496094, 52.64594268798828, 55.225337982177734, 57.80473327636719, 60.384124755859375, 62.96352005004883, 65.54291534423828, 68.12230682373047, 70.70169830322266, 73.28109741210938, 75.86048889160156, 78.43988037109375, 81.01927947998047, 83.59867095947266]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 6.0, 5.0, 8.0, 5.0, 5.0, 8.0, 12.0, 11.0, 14.0, 24.0, 12.0, 30.0, 34.0, 24.0, 35.0, 40.0, 35.0, 41.0, 51.0, 57.0, 46.0, 36.0, 52.0, 35.0, 51.0, 32.0, 56.0, 39.0, 22.0, 37.0, 22.0, 18.0, 17.0, 18.0, 16.0, 12.0, 12.0, 11.0, 3.0, 7.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.0078125, -13.6080322265625, -13.208251953125, -12.8084716796875, -12.40869140625, -12.0089111328125, -11.609130859375, -11.2093505859375, -10.8095703125, -10.4097900390625, -10.010009765625, -9.6102294921875, -9.21044921875, -8.8106689453125, -8.410888671875, -8.0111083984375, -7.611328125, -7.2115478515625, -6.811767578125, -6.4119873046875, -6.01220703125, -5.6124267578125, -5.212646484375, -4.8128662109375, -4.4130859375, -4.0133056640625, -3.613525390625, -3.2137451171875, -2.81396484375, -2.4141845703125, -2.014404296875, -1.6146240234375, -1.21484375, -0.8150634765625, -0.415283203125, -0.0155029296875, 0.38427734375, 0.7840576171875, 1.183837890625, 1.5836181640625, 1.9833984375, 2.3831787109375, 2.782958984375, 3.1827392578125, 3.58251953125, 3.9822998046875, 4.382080078125, 4.7818603515625, 5.181640625, 5.5814208984375, 5.981201171875, 6.3809814453125, 6.78076171875, 7.1805419921875, 7.580322265625, 7.9801025390625, 8.3798828125, 8.7796630859375, 9.179443359375, 9.5792236328125, 9.97900390625, 10.3787841796875, 10.778564453125, 11.1783447265625, 11.578125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 3.0, 6.0, 12.0, 12.0, 17.0, 28.0, 41.0, 57.0, 83.0, 150.0, 188.0, 322.0, 472.0, 726.0, 1119.0, 1722.0, 2875.0, 4245.0, 6940.0, 10948.0, 17504.0, 28215.0, 48305.0, 87119.0, 171175.0, 279773.0, 173563.0, 88023.0, 48633.0, 28861.0, 17513.0, 10926.0, 6925.0, 4273.0, 2750.0, 1787.0, 1134.0, 722.0, 486.0, 321.0, 197.0, 129.0, 85.0, 61.0, 44.0, 28.0, 20.0, 12.0, 6.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0634765625, -1.027435302734375, -0.99139404296875, -0.955352783203125, -0.9193115234375, -0.883270263671875, -0.84722900390625, -0.811187744140625, -0.775146484375, -0.739105224609375, -0.70306396484375, -0.667022705078125, -0.6309814453125, -0.594940185546875, -0.55889892578125, -0.522857666015625, -0.48681640625, -0.450775146484375, -0.41473388671875, -0.378692626953125, -0.3426513671875, -0.306610107421875, -0.27056884765625, -0.234527587890625, -0.198486328125, -0.162445068359375, -0.12640380859375, -0.090362548828125, -0.0543212890625, -0.018280029296875, 0.01776123046875, 0.053802490234375, 0.08984375, 0.125885009765625, 0.16192626953125, 0.197967529296875, 0.2340087890625, 0.270050048828125, 0.30609130859375, 0.342132568359375, 0.378173828125, 0.414215087890625, 0.45025634765625, 0.486297607421875, 0.5223388671875, 0.558380126953125, 0.59442138671875, 0.630462646484375, 0.66650390625, 0.702545166015625, 0.73858642578125, 0.774627685546875, 0.8106689453125, 0.846710205078125, 0.88275146484375, 0.918792724609375, 0.954833984375, 0.990875244140625, 1.02691650390625, 1.062957763671875, 1.0989990234375, 1.135040283203125, 1.17108154296875, 1.207122802734375, 1.2431640625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 3.0, 8.0, 7.0, 8.0, 8.0, 11.0, 19.0, 11.0, 7.0, 16.0, 25.0, 30.0, 26.0, 26.0, 28.0, 36.0, 41.0, 29.0, 32.0, 35.0, 33.0, 30.0, 26.0, 1064.0, 30.0, 37.0, 37.0, 25.0, 21.0, 27.0, 27.0, 37.0, 29.0, 25.0, 14.0, 13.0, 16.0, 16.0, 12.0, 10.0, 17.0, 10.0, 11.0, 8.0, 10.0, 14.0, 6.0, 7.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0], "bins": [-6.421875, -6.22979736328125, -6.0377197265625, -5.84564208984375, -5.653564453125, -5.46148681640625, -5.2694091796875, -5.07733154296875, -4.88525390625, -4.69317626953125, -4.5010986328125, -4.30902099609375, -4.116943359375, -3.92486572265625, -3.7327880859375, -3.54071044921875, -3.3486328125, -3.15655517578125, -2.9644775390625, -2.77239990234375, -2.580322265625, -2.38824462890625, -2.1961669921875, -2.00408935546875, -1.81201171875, -1.61993408203125, -1.4278564453125, -1.23577880859375, -1.043701171875, -0.85162353515625, -0.6595458984375, -0.46746826171875, -0.275390625, -0.08331298828125, 0.1087646484375, 0.30084228515625, 0.492919921875, 0.68499755859375, 0.8770751953125, 1.06915283203125, 1.26123046875, 1.45330810546875, 1.6453857421875, 1.83746337890625, 2.029541015625, 2.22161865234375, 2.4136962890625, 2.60577392578125, 2.7978515625, 2.98992919921875, 3.1820068359375, 3.37408447265625, 3.566162109375, 3.75823974609375, 3.9503173828125, 4.14239501953125, 4.33447265625, 4.52655029296875, 4.7186279296875, 4.91070556640625, 5.102783203125, 5.29486083984375, 5.4869384765625, 5.67901611328125, 5.87109375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 5.0, 8.0, 12.0, 12.0, 22.0, 27.0, 30.0, 61.0, 63.0, 96.0, 157.0, 224.0, 320.0, 524.0, 772.0, 1195.0, 1874.0, 2928.0, 4695.0, 7266.0, 11083.0, 17769.0, 28623.0, 46109.0, 80091.0, 152880.0, 1306637.0, 190999.0, 97544.0, 55156.0, 33276.0, 20309.0, 13055.0, 8273.0, 5281.0, 3505.0, 2177.0, 1400.0, 950.0, 576.0, 352.0, 255.0, 167.0, 107.0, 94.0, 57.0, 37.0, 25.0, 11.0, 21.0, 9.0, 10.0, 4.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.96826171875, -0.9366836547851562, -0.9051055908203125, -0.8735275268554688, -0.841949462890625, -0.8103713989257812, -0.7787933349609375, -0.7472152709960938, -0.71563720703125, -0.6840591430664062, -0.6524810791015625, -0.6209030151367188, -0.589324951171875, -0.5577468872070312, -0.5261688232421875, -0.49459075927734375, -0.4630126953125, -0.43143463134765625, -0.3998565673828125, -0.36827850341796875, -0.336700439453125, -0.30512237548828125, -0.2735443115234375, -0.24196624755859375, -0.21038818359375, -0.17881011962890625, -0.1472320556640625, -0.11565399169921875, -0.084075927734375, -0.05249786376953125, -0.0209197998046875, 0.01065826416015625, 0.042236328125, 0.07381439208984375, 0.1053924560546875, 0.13697052001953125, 0.168548583984375, 0.20012664794921875, 0.2317047119140625, 0.26328277587890625, 0.29486083984375, 0.32643890380859375, 0.3580169677734375, 0.38959503173828125, 0.421173095703125, 0.45275115966796875, 0.4843292236328125, 0.5159072875976562, 0.5474853515625, 0.5790634155273438, 0.6106414794921875, 0.6422195434570312, 0.673797607421875, 0.7053756713867188, 0.7369537353515625, 0.7685317993164062, 0.80010986328125, 0.8316879272460938, 0.8632659912109375, 0.8948440551757812, 0.926422119140625, 0.9580001831054688, 0.9895782470703125, 1.0211563110351562, 1.052734375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 8.0, 3.0, 10.0, 11.0, 13.0, 12.0, 13.0, 24.0, 27.0, 34.0, 35.0, 37.0, 46.0, 47.0, 56.0, 64.0, 70.0, 72.0, 65.0, 63.0, 57.0, 45.0, 31.0, 35.0, 29.0, 31.0, 15.0, 9.0, 4.0, 7.0, 10.0, 5.0, 9.0, 1.0, 0.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0029735565185546875, -0.0028873085975646973, -0.002801060676574707, -0.002714812755584717, -0.0026285648345947266, -0.0025423169136047363, -0.002456068992614746, -0.002369821071624756, -0.0022835731506347656, -0.0021973252296447754, -0.002111077308654785, -0.002024829387664795, -0.0019385814666748047, -0.0018523335456848145, -0.0017660856246948242, -0.001679837703704834, -0.0015935897827148438, -0.0015073418617248535, -0.0014210939407348633, -0.001334846019744873, -0.0012485980987548828, -0.0011623501777648926, -0.0010761022567749023, -0.0009898543357849121, -0.0009036064147949219, -0.0008173584938049316, -0.0007311105728149414, -0.0006448626518249512, -0.0005586147308349609, -0.0004723668098449707, -0.00038611888885498047, -0.00029987096786499023, -0.000213623046875, -0.00012737512588500977, -4.112720489501953e-05, 4.51207160949707e-05, 0.00013136863708496094, 0.00021761655807495117, 0.0003038644790649414, 0.00039011240005493164, 0.0004763603210449219, 0.0005626082420349121, 0.0006488561630249023, 0.0007351040840148926, 0.0008213520050048828, 0.000907599925994873, 0.0009938478469848633, 0.0010800957679748535, 0.0011663436889648438, 0.001252591609954834, 0.0013388395309448242, 0.0014250874519348145, 0.0015113353729248047, 0.001597583293914795, 0.0016838312149047852, 0.0017700791358947754, 0.0018563270568847656, 0.0019425749778747559, 0.002028822898864746, 0.0021150708198547363, 0.0022013187408447266, 0.002287566661834717, 0.002373814582824707, 0.0024600625038146973, 0.0025463104248046875]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 5.0, 7.0, 11.0, 6.0, 11.0, 18.0, 17.0, 26.0, 40.0, 57.0, 68.0, 96.0, 154.0, 220.0, 443.0, 1883.0, 88400.0, 943700.0, 11619.0, 830.0, 315.0, 174.0, 113.0, 94.0, 43.0, 59.0, 33.0, 21.0, 22.0, 17.0, 13.0, 8.0, 4.0, 5.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046630859375, -0.045038700103759766, -0.04344654083251953, -0.0418543815612793, -0.04026222229003906, -0.03867006301879883, -0.037077903747558594, -0.03548574447631836, -0.033893585205078125, -0.03230142593383789, -0.030709266662597656, -0.029117107391357422, -0.027524948120117188, -0.025932788848876953, -0.02434062957763672, -0.022748470306396484, -0.02115631103515625, -0.019564151763916016, -0.01797199249267578, -0.016379833221435547, -0.014787673950195312, -0.013195514678955078, -0.011603355407714844, -0.01001119613647461, -0.008419036865234375, -0.006826877593994141, -0.005234718322753906, -0.003642559051513672, -0.0020503997802734375, -0.0004582405090332031, 0.0011339187622070312, 0.0027260780334472656, 0.0043182373046875, 0.005910396575927734, 0.007502555847167969, 0.009094715118408203, 0.010686874389648438, 0.012279033660888672, 0.013871192932128906, 0.01546335220336914, 0.017055511474609375, 0.01864767074584961, 0.020239830017089844, 0.021831989288330078, 0.023424148559570312, 0.025016307830810547, 0.02660846710205078, 0.028200626373291016, 0.02979278564453125, 0.031384944915771484, 0.03297710418701172, 0.03456926345825195, 0.03616142272949219, 0.03775358200073242, 0.039345741271972656, 0.04093790054321289, 0.042530059814453125, 0.04412221908569336, 0.045714378356933594, 0.04730653762817383, 0.04889869689941406, 0.0504908561706543, 0.05208301544189453, 0.053675174713134766, 0.055267333984375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 10.0, 104.0, 606.0, 269.0, 20.0, 7.0], "bins": [-0.022555707022547722, -0.022184167057275772, -0.021812627092003822, -0.021441087126731873, -0.021069545298814774, -0.020698005333542824, -0.020326465368270874, -0.019954925402998924, -0.019583385437726974, -0.019211845472455025, -0.018840305507183075, -0.018468765541911125, -0.018097223713994026, -0.017725683748722076, -0.017354143783450127, -0.016982603818178177, -0.016611063852906227, -0.016239523887634277, -0.015867983922362328, -0.015496443025767803, -0.015124903060495853, -0.014753363095223904, -0.01438182219862938, -0.01401028223335743, -0.013638741336762905, -0.013267201371490955, -0.012895660474896431, -0.012524120509624481, -0.012152580544352531, -0.011781040579080582, -0.011409499682486057, -0.011037959717214108, -0.010666419751942158, -0.010294879786670208, -0.009923338890075684, -0.009551798924803734, -0.009180258959531784, -0.008808718994259834, -0.00843717809766531, -0.00806563813239336, -0.00769409816712141, -0.007322557736188173, -0.0069510177709162235, -0.0065794773399829865, -0.006207937374711037, -0.0058363969437778, -0.0054648565128445625, -0.005093316547572613, -0.004721776582300663, -0.004350236151367426, -0.003978696186095476, -0.003607155755162239, -0.0032356157898902893, -0.0028640753589570522, -0.002492535160854459, -0.0021209949627518654, -0.0017494545318186283, -0.0013779143337160349, -0.0010063741356134415, -0.0006348338210955262, -0.0002632936229929328, 0.00010824657510966063, 0.0004797868896275759, 0.0008513270877301693, 0.0012228672858327627]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 6.0, 6.0, 12.0, 9.0, 7.0, 16.0, 20.0, 23.0, 23.0, 31.0, 19.0, 30.0, 37.0, 42.0, 40.0, 44.0, 40.0, 37.0, 48.0, 49.0, 43.0, 47.0, 29.0, 37.0, 27.0, 43.0, 33.0, 26.0, 26.0, 19.0, 26.0, 18.0, 17.0, 17.0, 10.0, 6.0, 4.0, 9.0, 7.0, 5.0, 5.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0014628767967224121, -0.001420825719833374, -0.001378774642944336, -0.0013367235660552979, -0.0012946724891662598, -0.0012526214122772217, -0.0012105703353881836, -0.0011685192584991455, -0.0011264681816101074, -0.0010844171047210693, -0.0010423660278320312, -0.0010003149509429932, -0.0009582638740539551, -0.000916212797164917, -0.0008741617202758789, -0.0008321106433868408, -0.0007900595664978027, -0.0007480084896087646, -0.0007059574127197266, -0.0006639063358306885, -0.0006218552589416504, -0.0005798041820526123, -0.0005377531051635742, -0.0004957020282745361, -0.00045365095138549805, -0.00041159987449645996, -0.0003695487976074219, -0.0003274977207183838, -0.0002854466438293457, -0.00024339556694030762, -0.00020134449005126953, -0.00015929341316223145, -0.00011724233627319336, -7.519125938415527e-05, -3.314018249511719e-05, 8.910894393920898e-06, 5.0961971282958984e-05, 9.301304817199707e-05, 0.00013506412506103516, 0.00017711520195007324, 0.00021916627883911133, 0.0002612173557281494, 0.0003032684326171875, 0.0003453195095062256, 0.00038737058639526367, 0.00042942166328430176, 0.00047147274017333984, 0.0005135238170623779, 0.000555574893951416, 0.0005976259708404541, 0.0006396770477294922, 0.0006817281246185303, 0.0007237792015075684, 0.0007658302783966064, 0.0008078813552856445, 0.0008499324321746826, 0.0008919835090637207, 0.0009340345859527588, 0.0009760856628417969, 0.001018136739730835, 0.001060187816619873, 0.0011022388935089111, 0.0011442899703979492, 0.0011863410472869873, 0.0012283921241760254]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 6.0, 5.0, 8.0, 5.0, 5.0, 8.0, 12.0, 11.0, 14.0, 24.0, 12.0, 30.0, 34.0, 24.0, 35.0, 40.0, 35.0, 41.0, 51.0, 57.0, 46.0, 36.0, 52.0, 35.0, 51.0, 32.0, 56.0, 39.0, 22.0, 37.0, 22.0, 18.0, 17.0, 18.0, 16.0, 12.0, 12.0, 11.0, 3.0, 7.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.0078125, -13.6080322265625, -13.208251953125, -12.8084716796875, -12.40869140625, -12.0089111328125, -11.609130859375, -11.2093505859375, -10.8095703125, -10.4097900390625, -10.010009765625, -9.6102294921875, -9.21044921875, -8.8106689453125, -8.410888671875, -8.0111083984375, -7.611328125, -7.2115478515625, -6.811767578125, -6.4119873046875, -6.01220703125, -5.6124267578125, -5.212646484375, -4.8128662109375, -4.4130859375, -4.0133056640625, -3.613525390625, -3.2137451171875, -2.81396484375, -2.4141845703125, -2.014404296875, -1.6146240234375, -1.21484375, -0.8150634765625, -0.415283203125, -0.0155029296875, 0.38427734375, 0.7840576171875, 1.183837890625, 1.5836181640625, 1.9833984375, 2.3831787109375, 2.782958984375, 3.1827392578125, 3.58251953125, 3.9822998046875, 4.382080078125, 4.7818603515625, 5.181640625, 5.5814208984375, 5.981201171875, 6.3809814453125, 6.78076171875, 7.1805419921875, 7.580322265625, 7.9801025390625, 8.3798828125, 8.7796630859375, 9.179443359375, 9.5792236328125, 9.97900390625, 10.3787841796875, 10.778564453125, 11.1783447265625, 11.578125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 8.0, 6.0, 5.0, 8.0, 14.0, 28.0, 25.0, 37.0, 50.0, 62.0, 94.0, 143.0, 272.0, 446.0, 792.0, 1569.0, 3518.0, 8994.0, 25744.0, 90584.0, 434672.0, 366254.0, 78070.0, 22536.0, 8019.0, 3224.0, 1479.0, 729.0, 413.0, 246.0, 159.0, 91.0, 78.0, 50.0, 47.0, 22.0, 21.0, 9.0, 9.0, 9.0, 5.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.21875, -8.9622802734375, -8.705810546875, -8.4493408203125, -8.19287109375, -7.9364013671875, -7.679931640625, -7.4234619140625, -7.1669921875, -6.9105224609375, -6.654052734375, -6.3975830078125, -6.14111328125, -5.8846435546875, -5.628173828125, -5.3717041015625, -5.115234375, -4.8587646484375, -4.602294921875, -4.3458251953125, -4.08935546875, -3.8328857421875, -3.576416015625, -3.3199462890625, -3.0634765625, -2.8070068359375, -2.550537109375, -2.2940673828125, -2.03759765625, -1.7811279296875, -1.524658203125, -1.2681884765625, -1.01171875, -0.7552490234375, -0.498779296875, -0.2423095703125, 0.01416015625, 0.2706298828125, 0.527099609375, 0.7835693359375, 1.0400390625, 1.2965087890625, 1.552978515625, 1.8094482421875, 2.06591796875, 2.3223876953125, 2.578857421875, 2.8353271484375, 3.091796875, 3.3482666015625, 3.604736328125, 3.8612060546875, 4.11767578125, 4.3741455078125, 4.630615234375, 4.8870849609375, 5.1435546875, 5.4000244140625, 5.656494140625, 5.9129638671875, 6.16943359375, 6.4259033203125, 6.682373046875, 6.9388427734375, 7.1953125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 6.0, 5.0, 5.0, 6.0, 14.0, 13.0, 17.0, 15.0, 21.0, 20.0, 25.0, 33.0, 32.0, 27.0, 47.0, 35.0, 35.0, 36.0, 64.0, 177.0, 1814.0, 142.0, 48.0, 39.0, 40.0, 36.0, 40.0, 28.0, 34.0, 28.0, 21.0, 31.0, 15.0, 20.0, 13.0, 11.0, 7.0, 11.0, 5.0, 7.0, 5.0, 6.0, 6.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-39.40625, -38.18994140625, -36.9736328125, -35.75732421875, -34.541015625, -33.32470703125, -32.1083984375, -30.89208984375, -29.67578125, -28.45947265625, -27.2431640625, -26.02685546875, -24.810546875, -23.59423828125, -22.3779296875, -21.16162109375, -19.9453125, -18.72900390625, -17.5126953125, -16.29638671875, -15.080078125, -13.86376953125, -12.6474609375, -11.43115234375, -10.21484375, -8.99853515625, -7.7822265625, -6.56591796875, -5.349609375, -4.13330078125, -2.9169921875, -1.70068359375, -0.484375, 0.73193359375, 1.9482421875, 3.16455078125, 4.380859375, 5.59716796875, 6.8134765625, 8.02978515625, 9.24609375, 10.46240234375, 11.6787109375, 12.89501953125, 14.111328125, 15.32763671875, 16.5439453125, 17.76025390625, 18.9765625, 20.19287109375, 21.4091796875, 22.62548828125, 23.841796875, 25.05810546875, 26.2744140625, 27.49072265625, 28.70703125, 29.92333984375, 31.1396484375, 32.35595703125, 33.572265625, 34.78857421875, 36.0048828125, 37.22119140625, 38.4375]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 4.0, 6.0, 2.0, 9.0, 4.0, 9.0, 4.0, 7.0, 10.0, 9.0, 14.0, 20.0, 20.0, 37.0, 36.0, 47.0, 66.0, 72.0, 102.0, 138.0, 228.0, 275.0, 586.0, 2985.0, 2675446.0, 461764.0, 2254.0, 530.0, 272.0, 193.0, 133.0, 108.0, 69.0, 55.0, 34.0, 28.0, 31.0, 20.0, 16.0, 19.0, 12.0, 11.0, 8.0, 4.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-76.375, -73.90625, -71.4375, -68.96875, -66.5, -64.03125, -61.5625, -59.09375, -56.625, -54.15625, -51.6875, -49.21875, -46.75, -44.28125, -41.8125, -39.34375, -36.875, -34.40625, -31.9375, -29.46875, -27.0, -24.53125, -22.0625, -19.59375, -17.125, -14.65625, -12.1875, -9.71875, -7.25, -4.78125, -2.3125, 0.15625, 2.625, 5.09375, 7.5625, 10.03125, 12.5, 14.96875, 17.4375, 19.90625, 22.375, 24.84375, 27.3125, 29.78125, 32.25, 34.71875, 37.1875, 39.65625, 42.125, 44.59375, 47.0625, 49.53125, 52.0, 54.46875, 56.9375, 59.40625, 61.875, 64.34375, 66.8125, 69.28125, 71.75, 74.21875, 76.6875, 79.15625, 81.625]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [21.0, 499.0, 470.0, 27.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.086040496826172, -6.152369976043701, -0.21869945526123047, 5.714971542358398, 11.648641586303711, 17.582311630249023, 23.51598358154297, 29.44965362548828, 35.383323669433594, 41.316993713378906, 47.25066375732422, 53.18433380126953, 59.118003845214844, 65.05167388916016, 70.9853515625, 76.91902160644531, 82.85269165039062, 88.78636169433594, 94.72003173828125, 100.65370178222656, 106.58737182617188, 112.52104187011719, 118.4547119140625, 124.38838195800781, 130.32205200195312, 136.25572204589844, 142.18939208984375, 148.12306213378906, 154.05673217773438, 159.9904022216797, 165.924072265625, 171.8577423095703, 177.7914276123047, 183.72509765625, 189.6587677001953, 195.59243774414062, 201.52610778808594, 207.45977783203125, 213.39344787597656, 219.32711791992188, 225.2607879638672, 231.1944580078125, 237.1281280517578, 243.06179809570312, 248.99546813964844, 254.92913818359375, 260.8628234863281, 266.7964782714844, 272.73016357421875, 278.6638488769531, 284.5975036621094, 290.53118896484375, 296.46484375, 302.3985290527344, 308.3321838378906, 314.265869140625, 320.19952392578125, 326.1332092285156, 332.0668640136719, 338.00054931640625, 343.9342041015625, 349.8678894042969, 355.8015441894531, 361.7352294921875, 367.66888427734375]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 3.0, 5.0, 4.0, 5.0, 9.0, 12.0, 14.0, 13.0, 19.0, 15.0, 21.0, 21.0, 22.0, 24.0, 25.0, 33.0, 31.0, 42.0, 32.0, 41.0, 34.0, 46.0, 30.0, 41.0, 40.0, 40.0, 44.0, 25.0, 30.0, 28.0, 23.0, 34.0, 20.0, 27.0, 12.0, 17.0, 19.0, 13.0, 13.0, 13.0, 13.0, 13.0, 7.0, 4.0, 4.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-90.28437042236328, -87.35931396484375, -84.43425750732422, -81.50920104980469, -78.58414459228516, -75.65908813476562, -72.7340316772461, -69.80897521972656, -66.88391876220703, -63.9588623046875, -61.03380584716797, -58.10874938964844, -55.183692932128906, -52.258636474609375, -49.333580017089844, -46.40852355957031, -43.48346710205078, -40.55841064453125, -37.63335418701172, -34.70829772949219, -31.783241271972656, -28.858184814453125, -25.933128356933594, -23.008071899414062, -20.08301544189453, -17.157958984375, -14.232902526855469, -11.307846069335938, -8.382789611816406, -5.457733154296875, -2.5326766967773438, 0.3923797607421875, 3.3174362182617188, 6.24249267578125, 9.167549133300781, 12.092605590820312, 15.017662048339844, 17.942718505859375, 20.867774963378906, 23.792831420898438, 26.71788787841797, 29.6429443359375, 32.56800079345703, 35.49305725097656, 38.418113708496094, 41.343170166015625, 44.268226623535156, 47.19328308105469, 50.11833953857422, 53.04339599609375, 55.96845245361328, 58.89350891113281, 61.818565368652344, 64.74362182617188, 67.6686782836914, 70.59373474121094, 73.51879119873047, 76.44384765625, 79.36890411376953, 82.29396057128906, 85.2190170288086, 88.14407348632812, 91.06912994384766, 93.99418640136719, 96.91924285888672]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 6.0, 8.0, 6.0, 6.0, 11.0, 9.0, 11.0, 16.0, 15.0, 23.0, 26.0, 33.0, 20.0, 32.0, 35.0, 34.0, 41.0, 54.0, 45.0, 49.0, 38.0, 48.0, 37.0, 47.0, 30.0, 43.0, 49.0, 32.0, 29.0, 24.0, 25.0, 21.0, 16.0, 15.0, 13.0, 12.0, 15.0, 6.0, 6.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.6328125, -13.246826171875, -12.86083984375, -12.474853515625, -12.0888671875, -11.702880859375, -11.31689453125, -10.930908203125, -10.544921875, -10.158935546875, -9.77294921875, -9.386962890625, -9.0009765625, -8.614990234375, -8.22900390625, -7.843017578125, -7.45703125, -7.071044921875, -6.68505859375, -6.299072265625, -5.9130859375, -5.527099609375, -5.14111328125, -4.755126953125, -4.369140625, -3.983154296875, -3.59716796875, -3.211181640625, -2.8251953125, -2.439208984375, -2.05322265625, -1.667236328125, -1.28125, -0.895263671875, -0.50927734375, -0.123291015625, 0.2626953125, 0.648681640625, 1.03466796875, 1.420654296875, 1.806640625, 2.192626953125, 2.57861328125, 2.964599609375, 3.3505859375, 3.736572265625, 4.12255859375, 4.508544921875, 4.89453125, 5.280517578125, 5.66650390625, 6.052490234375, 6.4384765625, 6.824462890625, 7.21044921875, 7.596435546875, 7.982421875, 8.368408203125, 8.75439453125, 9.140380859375, 9.5263671875, 9.912353515625, 10.29833984375, 10.684326171875, 11.0703125]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 6.0, 8.0, 7.0, 5.0, 5.0, 13.0, 12.0, 5.0, 16.0, 21.0, 20.0, 34.0, 29.0, 56.0, 63.0, 126.0, 238.0, 612.0, 1726.0, 6020.0, 130081.0, 3989020.0, 58605.0, 4998.0, 1460.0, 496.0, 214.0, 105.0, 67.0, 38.0, 32.0, 28.0, 19.0, 14.0, 21.0, 14.0, 12.0, 12.0, 10.0, 6.0, 6.0, 1.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-71.625, -69.54443359375, -67.4638671875, -65.38330078125, -63.302734375, -61.22216796875, -59.1416015625, -57.06103515625, -54.98046875, -52.89990234375, -50.8193359375, -48.73876953125, -46.658203125, -44.57763671875, -42.4970703125, -40.41650390625, -38.3359375, -36.25537109375, -34.1748046875, -32.09423828125, -30.013671875, -27.93310546875, -25.8525390625, -23.77197265625, -21.69140625, -19.61083984375, -17.5302734375, -15.44970703125, -13.369140625, -11.28857421875, -9.2080078125, -7.12744140625, -5.046875, -2.96630859375, -0.8857421875, 1.19482421875, 3.275390625, 5.35595703125, 7.4365234375, 9.51708984375, 11.59765625, 13.67822265625, 15.7587890625, 17.83935546875, 19.919921875, 22.00048828125, 24.0810546875, 26.16162109375, 28.2421875, 30.32275390625, 32.4033203125, 34.48388671875, 36.564453125, 38.64501953125, 40.7255859375, 42.80615234375, 44.88671875, 46.96728515625, 49.0478515625, 51.12841796875, 53.208984375, 55.28955078125, 57.3701171875, 59.45068359375, 61.53125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 3.0, 9.0, 5.0, 6.0, 12.0, 14.0, 17.0, 43.0, 70.0, 115.0, 215.0, 368.0, 654.0, 769.0, 705.0, 438.0, 247.0, 125.0, 72.0, 40.0, 35.0, 23.0, 16.0, 16.0, 11.0, 9.0, 6.0, 9.0, 2.0, 2.0, 4.0, 1.0, 7.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.3125, -28.386962890625, -27.46142578125, -26.535888671875, -25.6103515625, -24.684814453125, -23.75927734375, -22.833740234375, -21.908203125, -20.982666015625, -20.05712890625, -19.131591796875, -18.2060546875, -17.280517578125, -16.35498046875, -15.429443359375, -14.50390625, -13.578369140625, -12.65283203125, -11.727294921875, -10.8017578125, -9.876220703125, -8.95068359375, -8.025146484375, -7.099609375, -6.174072265625, -5.24853515625, -4.322998046875, -3.3974609375, -2.471923828125, -1.54638671875, -0.620849609375, 0.3046875, 1.230224609375, 2.15576171875, 3.081298828125, 4.0068359375, 4.932373046875, 5.85791015625, 6.783447265625, 7.708984375, 8.634521484375, 9.56005859375, 10.485595703125, 11.4111328125, 12.336669921875, 13.26220703125, 14.187744140625, 15.11328125, 16.038818359375, 16.96435546875, 17.889892578125, 18.8154296875, 19.740966796875, 20.66650390625, 21.592041015625, 22.517578125, 23.443115234375, 24.36865234375, 25.294189453125, 26.2197265625, 27.145263671875, 28.07080078125, 28.996337890625, 29.921875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 3.0, 3.0, 5.0, 7.0, 5.0, 10.0, 13.0, 21.0, 32.0, 60.0, 108.0, 198.0, 519.0, 1293.0, 3819.0, 15242.0, 180946.0, 3910099.0, 66965.0, 10327.0, 2827.0, 984.0, 422.0, 166.0, 96.0, 34.0, 22.0, 12.0, 11.0, 10.0, 6.0, 5.0, 1.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-80.75, -78.2548828125, -75.759765625, -73.2646484375, -70.76953125, -68.2744140625, -65.779296875, -63.2841796875, -60.7890625, -58.2939453125, -55.798828125, -53.3037109375, -50.80859375, -48.3134765625, -45.818359375, -43.3232421875, -40.828125, -38.3330078125, -35.837890625, -33.3427734375, -30.84765625, -28.3525390625, -25.857421875, -23.3623046875, -20.8671875, -18.3720703125, -15.876953125, -13.3818359375, -10.88671875, -8.3916015625, -5.896484375, -3.4013671875, -0.90625, 1.5888671875, 4.083984375, 6.5791015625, 9.07421875, 11.5693359375, 14.064453125, 16.5595703125, 19.0546875, 21.5498046875, 24.044921875, 26.5400390625, 29.03515625, 31.5302734375, 34.025390625, 36.5205078125, 39.015625, 41.5107421875, 44.005859375, 46.5009765625, 48.99609375, 51.4912109375, 53.986328125, 56.4814453125, 58.9765625, 61.4716796875, 63.966796875, 66.4619140625, 68.95703125, 71.4521484375, 73.947265625, 76.4423828125, 78.9375]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 23.0, 118.0, 533.0, 289.0, 40.0, 11.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.51449584960938, -87.0298843383789, -68.54527282714844, -50.0606689453125, -31.57605743408203, -13.091445922851562, 5.393157958984375, 23.877777099609375, 42.36238098144531, 60.84699249267578, 79.33160400390625, 97.81620788574219, 116.30081939697266, 134.78543090820312, 153.27003479003906, 171.75465393066406, 190.2392578125, 208.72386169433594, 227.20848083496094, 245.69308471679688, 264.1777038574219, 282.66229248046875, 301.14691162109375, 319.63153076171875, 338.11614990234375, 356.60076904296875, 375.0853576660156, 393.5699768066406, 412.0545959472656, 430.5391845703125, 449.0238037109375, 467.5084228515625, 485.99298095703125, 504.47760009765625, 522.9622192382812, 541.44677734375, 559.931396484375, 578.416015625, 596.900634765625, 615.38525390625, 633.869873046875, 652.3544921875, 670.839111328125, 689.32373046875, 707.8082885742188, 726.2929077148438, 744.7775268554688, 763.2621459960938, 781.7467041015625, 800.2313232421875, 818.7159423828125, 837.2005615234375, 855.6851196289062, 874.1697387695312, 892.6543579101562, 911.1389770507812, 929.6235961914062, 948.1082153320312, 966.5928344726562, 985.077392578125, 1003.56201171875, 1022.046630859375, 1040.53125, 1059.015869140625, 1077.50048828125]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 10.0, 6.0, 7.0, 11.0, 12.0, 17.0, 19.0, 29.0, 34.0, 41.0, 39.0, 45.0, 60.0, 54.0, 48.0, 48.0, 73.0, 44.0, 50.0, 51.0, 43.0, 39.0, 41.0, 37.0, 20.0, 20.0, 16.0, 27.0, 18.0, 10.0, 9.0, 7.0, 6.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.1269302368164, -92.13861083984375, -89.1502914428711, -86.16197204589844, -83.17365264892578, -80.18533325195312, -77.19700622558594, -74.20869445800781, -71.22036743164062, -68.23204803466797, -65.24372863769531, -62.255409240722656, -59.26708984375, -56.278770446777344, -53.29044723510742, -50.302127838134766, -47.313812255859375, -44.32549285888672, -41.33717346191406, -38.348854064941406, -35.36053466796875, -32.372215270996094, -29.383892059326172, -26.395572662353516, -23.40725326538086, -20.418933868408203, -17.430614471435547, -14.442293167114258, -11.453973770141602, -8.465654373168945, -5.477333068847656, -2.489013671875, 0.499298095703125, 3.4876179695129395, 6.475937843322754, 9.464258193969727, 12.452577590942383, 15.440896987915039, 18.429218292236328, 21.417537689208984, 24.40585708618164, 27.394176483154297, 30.382495880126953, 33.370819091796875, 36.35913848876953, 39.34745788574219, 42.335777282714844, 45.3240966796875, 48.312416076660156, 51.30073547363281, 54.28905487060547, 57.277374267578125, 60.26569366455078, 63.25401306152344, 66.24234008789062, 69.23065185546875, 72.21897888183594, 75.2072982788086, 78.19561767578125, 81.1839370727539, 84.17225646972656, 87.16057586669922, 90.14889526367188, 93.13722229003906, 96.12553405761719]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 2.0, 8.0, 6.0, 8.0, 7.0, 16.0, 13.0, 20.0, 25.0, 20.0, 19.0, 27.0, 25.0, 32.0, 51.0, 36.0, 54.0, 39.0, 41.0, 41.0, 45.0, 41.0, 40.0, 48.0, 33.0, 30.0, 43.0, 37.0, 26.0, 31.0, 23.0, 19.0, 14.0, 19.0, 8.0, 10.0, 6.0, 5.0, 7.0, 6.0, 5.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-13.7578125, -13.37451171875, -12.9912109375, -12.60791015625, -12.224609375, -11.84130859375, -11.4580078125, -11.07470703125, -10.69140625, -10.30810546875, -9.9248046875, -9.54150390625, -9.158203125, -8.77490234375, -8.3916015625, -8.00830078125, -7.625, -7.24169921875, -6.8583984375, -6.47509765625, -6.091796875, -5.70849609375, -5.3251953125, -4.94189453125, -4.55859375, -4.17529296875, -3.7919921875, -3.40869140625, -3.025390625, -2.64208984375, -2.2587890625, -1.87548828125, -1.4921875, -1.10888671875, -0.7255859375, -0.34228515625, 0.041015625, 0.42431640625, 0.8076171875, 1.19091796875, 1.57421875, 1.95751953125, 2.3408203125, 2.72412109375, 3.107421875, 3.49072265625, 3.8740234375, 4.25732421875, 4.640625, 5.02392578125, 5.4072265625, 5.79052734375, 6.173828125, 6.55712890625, 6.9404296875, 7.32373046875, 7.70703125, 8.09033203125, 8.4736328125, 8.85693359375, 9.240234375, 9.62353515625, 10.0068359375, 10.39013671875, 10.7734375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 8.0, 6.0, 8.0, 13.0, 16.0, 31.0, 35.0, 54.0, 83.0, 110.0, 139.0, 227.0, 282.0, 463.0, 653.0, 949.0, 1475.0, 2175.0, 3207.0, 4918.0, 7468.0, 11659.0, 18083.0, 28805.0, 48990.0, 87537.0, 163386.0, 255120.0, 178118.0, 95347.0, 52841.0, 30762.0, 19308.0, 12536.0, 7949.0, 5308.0, 3456.0, 2214.0, 1574.0, 1051.0, 648.0, 501.0, 285.0, 228.0, 166.0, 123.0, 70.0, 49.0, 43.0, 28.0, 16.0, 16.0, 9.0, 8.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.0400390625, -1.0070953369140625, -0.974151611328125, -0.9412078857421875, -0.90826416015625, -0.8753204345703125, -0.842376708984375, -0.8094329833984375, -0.7764892578125, -0.7435455322265625, -0.710601806640625, -0.6776580810546875, -0.64471435546875, -0.6117706298828125, -0.578826904296875, -0.5458831787109375, -0.512939453125, -0.4799957275390625, -0.447052001953125, -0.4141082763671875, -0.38116455078125, -0.3482208251953125, -0.315277099609375, -0.2823333740234375, -0.2493896484375, -0.2164459228515625, -0.183502197265625, -0.1505584716796875, -0.11761474609375, -0.0846710205078125, -0.051727294921875, -0.0187835693359375, 0.01416015625, 0.0471038818359375, 0.080047607421875, 0.1129913330078125, 0.14593505859375, 0.1788787841796875, 0.211822509765625, 0.2447662353515625, 0.2777099609375, 0.3106536865234375, 0.343597412109375, 0.3765411376953125, 0.40948486328125, 0.4424285888671875, 0.475372314453125, 0.5083160400390625, 0.541259765625, 0.5742034912109375, 0.607147216796875, 0.6400909423828125, 0.67303466796875, 0.7059783935546875, 0.738922119140625, 0.7718658447265625, 0.8048095703125, 0.8377532958984375, 0.870697021484375, 0.9036407470703125, 0.93658447265625, 0.9695281982421875, 1.002471923828125, 1.0354156494140625, 1.068359375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 6.0, 5.0, 8.0, 9.0, 7.0, 14.0, 16.0, 19.0, 24.0, 26.0, 21.0, 35.0, 40.0, 43.0, 49.0, 40.0, 42.0, 52.0, 45.0, 1067.0, 43.0, 47.0, 38.0, 39.0, 43.0, 33.0, 21.0, 35.0, 28.0, 18.0, 22.0, 17.0, 18.0, 17.0, 12.0, 9.0, 5.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.76953125, -7.50445556640625, -7.2393798828125, -6.97430419921875, -6.709228515625, -6.44415283203125, -6.1790771484375, -5.91400146484375, -5.64892578125, -5.38385009765625, -5.1187744140625, -4.85369873046875, -4.588623046875, -4.32354736328125, -4.0584716796875, -3.79339599609375, -3.5283203125, -3.26324462890625, -2.9981689453125, -2.73309326171875, -2.468017578125, -2.20294189453125, -1.9378662109375, -1.67279052734375, -1.40771484375, -1.14263916015625, -0.8775634765625, -0.61248779296875, -0.347412109375, -0.08233642578125, 0.1827392578125, 0.44781494140625, 0.712890625, 0.97796630859375, 1.2430419921875, 1.50811767578125, 1.773193359375, 2.03826904296875, 2.3033447265625, 2.56842041015625, 2.83349609375, 3.09857177734375, 3.3636474609375, 3.62872314453125, 3.893798828125, 4.15887451171875, 4.4239501953125, 4.68902587890625, 4.9541015625, 5.21917724609375, 5.4842529296875, 5.74932861328125, 6.014404296875, 6.27947998046875, 6.5445556640625, 6.80963134765625, 7.07470703125, 7.33978271484375, 7.6048583984375, 7.86993408203125, 8.135009765625, 8.40008544921875, 8.6651611328125, 8.93023681640625, 9.1953125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 5.0, 10.0, 14.0, 25.0, 26.0, 39.0, 46.0, 93.0, 124.0, 204.0, 326.0, 464.0, 786.0, 1218.0, 2104.0, 3572.0, 6144.0, 10332.0, 18710.0, 34470.0, 67177.0, 139185.0, 1346359.0, 240239.0, 107593.0, 53197.0, 27943.0, 15315.0, 8703.0, 5050.0, 2964.0, 1762.0, 1089.0, 628.0, 427.0, 252.0, 188.0, 109.0, 91.0, 41.0, 34.0, 21.0, 17.0, 14.0, 9.0, 5.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.3505859375, -1.3094482421875, -1.268310546875, -1.2271728515625, -1.18603515625, -1.1448974609375, -1.103759765625, -1.0626220703125, -1.021484375, -0.9803466796875, -0.939208984375, -0.8980712890625, -0.85693359375, -0.8157958984375, -0.774658203125, -0.7335205078125, -0.6923828125, -0.6512451171875, -0.610107421875, -0.5689697265625, -0.52783203125, -0.4866943359375, -0.445556640625, -0.4044189453125, -0.36328125, -0.3221435546875, -0.281005859375, -0.2398681640625, -0.19873046875, -0.1575927734375, -0.116455078125, -0.0753173828125, -0.0341796875, 0.0069580078125, 0.048095703125, 0.0892333984375, 0.13037109375, 0.1715087890625, 0.212646484375, 0.2537841796875, 0.294921875, 0.3360595703125, 0.377197265625, 0.4183349609375, 0.45947265625, 0.5006103515625, 0.541748046875, 0.5828857421875, 0.6240234375, 0.6651611328125, 0.706298828125, 0.7474365234375, 0.78857421875, 0.8297119140625, 0.870849609375, 0.9119873046875, 0.953125, 0.9942626953125, 1.035400390625, 1.0765380859375, 1.11767578125, 1.1588134765625, 1.199951171875, 1.2410888671875, 1.2822265625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 10.0, 7.0, 10.0, 10.0, 15.0, 22.0, 26.0, 25.0, 24.0, 45.0, 41.0, 45.0, 33.0, 54.0, 66.0, 56.0, 63.0, 64.0, 56.0, 48.0, 47.0, 28.0, 34.0, 30.0, 19.0, 15.0, 16.0, 19.0, 13.0, 7.0, 10.0, 11.0, 4.0, 1.0, 5.0, 2.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002521514892578125, -0.002437978982925415, -0.002354443073272705, -0.002270907163619995, -0.002187371253967285, -0.002103835344314575, -0.0020202994346618652, -0.0019367635250091553, -0.0018532276153564453, -0.0017696917057037354, -0.0016861557960510254, -0.0016026198863983154, -0.0015190839767456055, -0.0014355480670928955, -0.0013520121574401855, -0.0012684762477874756, -0.0011849403381347656, -0.0011014044284820557, -0.0010178685188293457, -0.0009343326091766357, -0.0008507966995239258, -0.0007672607898712158, -0.0006837248802185059, -0.0006001889705657959, -0.0005166530609130859, -0.000433117151260376, -0.000349581241607666, -0.00026604533195495605, -0.0001825094223022461, -9.897351264953613e-05, -1.5437602996826172e-05, 6.809830665588379e-05, 0.00015163421630859375, 0.0002351701259613037, 0.00031870603561401367, 0.00040224194526672363, 0.0004857778549194336, 0.0005693137645721436, 0.0006528496742248535, 0.0007363855838775635, 0.0008199214935302734, 0.0009034574031829834, 0.0009869933128356934, 0.0010705292224884033, 0.0011540651321411133, 0.0012376010417938232, 0.0013211369514465332, 0.0014046728610992432, 0.0014882087707519531, 0.001571744680404663, 0.001655280590057373, 0.001738816499710083, 0.001822352409362793, 0.001905888319015503, 0.001989424228668213, 0.002072960138320923, 0.002156496047973633, 0.0022400319576263428, 0.0023235678672790527, 0.0024071037769317627, 0.0024906396865844727, 0.0025741755962371826, 0.0026577115058898926, 0.0027412474155426025, 0.0028247833251953125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 5.0, 7.0, 5.0, 8.0, 12.0, 10.0, 17.0, 27.0, 27.0, 34.0, 48.0, 81.0, 88.0, 168.0, 274.0, 705.0, 6833.0, 934096.0, 103318.0, 1666.0, 410.0, 214.0, 132.0, 98.0, 66.0, 53.0, 33.0, 30.0, 21.0, 15.0, 7.0, 17.0, 9.0, 6.0, 3.0, 3.0, 1.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0531005859375, -0.0512542724609375, -0.049407958984375, -0.0475616455078125, -0.04571533203125, -0.0438690185546875, -0.042022705078125, -0.0401763916015625, -0.038330078125, -0.0364837646484375, -0.034637451171875, -0.0327911376953125, -0.03094482421875, -0.0290985107421875, -0.027252197265625, -0.0254058837890625, -0.0235595703125, -0.0217132568359375, -0.019866943359375, -0.0180206298828125, -0.01617431640625, -0.0143280029296875, -0.012481689453125, -0.0106353759765625, -0.0087890625, -0.0069427490234375, -0.005096435546875, -0.0032501220703125, -0.00140380859375, 0.0004425048828125, 0.002288818359375, 0.0041351318359375, 0.0059814453125, 0.0078277587890625, 0.009674072265625, 0.0115203857421875, 0.01336669921875, 0.0152130126953125, 0.017059326171875, 0.0189056396484375, 0.020751953125, 0.0225982666015625, 0.024444580078125, 0.0262908935546875, 0.02813720703125, 0.0299835205078125, 0.031829833984375, 0.0336761474609375, 0.0355224609375, 0.0373687744140625, 0.039215087890625, 0.0410614013671875, 0.04290771484375, 0.0447540283203125, 0.046600341796875, 0.0484466552734375, 0.05029296875, 0.0521392822265625, 0.053985595703125, 0.0558319091796875, 0.05767822265625, 0.0595245361328125, 0.061370849609375, 0.0632171630859375, 0.0650634765625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 15.0, 23.0, 49.0, 89.0, 230.0, 271.0, 182.0, 88.0, 32.0, 17.0, 10.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025959000922739506, -0.002454104833304882, -0.00231230934150517, -0.0021705140825361013, -0.002028718590736389, -0.0018869233317673206, -0.001745128072798252, -0.0016033326974138618, -0.0014615373220294714, -0.001319741946645081, -0.0011779465712606907, -0.0010361513122916222, -0.0008943559369072318, -0.0007525605615228415, -0.000610765244346112, -0.00046896992716938257, -0.0003271745517849922, -0.00018537920550443232, -4.358385922387242e-05, 9.821148705668747e-05, 0.00024000683333724737, 0.0003818022087216377, 0.0005235975258983672, 0.0006653928430750966, 0.000807188218459487, 0.0009489835938438773, 0.0010907789692282677, 0.0012325742281973362, 0.0013743696035817266, 0.001516164978966117, 0.0016579602379351854, 0.0017997556133195758, 0.0019415514543652534, 0.002083346713334322, 0.002225142205134034, 0.0023669374641031027, 0.002508732955902815, 0.0026505282148718834, 0.002792323473840952, 0.0029341187328100204, 0.0030759142246097326, 0.003217709483578801, 0.0033595049753785133, 0.003501300234347582, 0.0036430954933166504, 0.0037848909851163626, 0.003926686476916075, 0.004068481735885143, 0.004210276994854212, 0.00435207225382328, 0.004493867512792349, 0.004635663237422705, 0.004777458496391773, 0.004919253755360842, 0.00506104901432991, 0.005202844273298979, 0.005344639532268047, 0.005486434791237116, 0.005628230050206184, 0.00577002577483654, 0.005911821033805609, 0.006053616292774677, 0.006195411551743746, 0.006337206810712814, 0.00647900253534317]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 1.0, 3.0, 5.0, 2.0, 1.0, 8.0, 8.0, 6.0, 10.0, 9.0, 18.0, 17.0, 25.0, 27.0, 17.0, 40.0, 25.0, 24.0, 39.0, 30.0, 37.0, 34.0, 45.0, 47.0, 43.0, 49.0, 40.0, 41.0, 30.0, 37.0, 34.0, 24.0, 27.0, 35.0, 15.0, 21.0, 25.0, 20.0, 15.0, 26.0, 8.0, 10.0, 10.0, 9.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0013976693153381348, -0.0013534165918827057, -0.0013091638684272766, -0.0012649111449718475, -0.0012206584215164185, -0.0011764056980609894, -0.0011321529746055603, -0.0010879002511501312, -0.0010436475276947021, -0.000999394804239273, -0.000955142080783844, -0.0009108893573284149, -0.0008666366338729858, -0.0008223839104175568, -0.0007781311869621277, -0.0007338784635066986, -0.0006896257400512695, -0.0006453730165958405, -0.0006011202931404114, -0.0005568675696849823, -0.0005126148462295532, -0.00046836212277412415, -0.00042410939931869507, -0.000379856675863266, -0.0003356039524078369, -0.00029135122895240784, -0.00024709850549697876, -0.00020284578204154968, -0.0001585930585861206, -0.00011434033513069153, -7.008761167526245e-05, -2.5834888219833374e-05, 1.8417835235595703e-05, 6.267055869102478e-05, 0.00010692328214645386, 0.00015117600560188293, 0.000195428729057312, 0.0002396814525127411, 0.00028393417596817017, 0.00032818689942359924, 0.0003724396228790283, 0.0004166923463344574, 0.0004609450697898865, 0.0005051977932453156, 0.0005494505167007446, 0.0005937032401561737, 0.0006379559636116028, 0.0006822086870670319, 0.0007264614105224609, 0.00077071413397789, 0.0008149668574333191, 0.0008592195808887482, 0.0009034723043441772, 0.0009477250277996063, 0.0009919777512550354, 0.0010362304747104645, 0.0010804831981658936, 0.0011247359216213226, 0.0011689886450767517, 0.0012132413685321808, 0.0012574940919876099, 0.001301746815443039, 0.001345999538898468, 0.001390252262353897, 0.0014345049858093262]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 2.0, 8.0, 6.0, 8.0, 7.0, 16.0, 13.0, 20.0, 25.0, 20.0, 19.0, 27.0, 25.0, 32.0, 51.0, 36.0, 54.0, 39.0, 41.0, 41.0, 45.0, 41.0, 40.0, 48.0, 32.0, 31.0, 43.0, 37.0, 26.0, 31.0, 23.0, 19.0, 14.0, 19.0, 8.0, 10.0, 6.0, 5.0, 7.0, 6.0, 5.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-13.7578125, -13.37451171875, -12.9912109375, -12.60791015625, -12.224609375, -11.84130859375, -11.4580078125, -11.07470703125, -10.69140625, -10.30810546875, -9.9248046875, -9.54150390625, -9.158203125, -8.77490234375, -8.3916015625, -8.00830078125, -7.625, -7.24169921875, -6.8583984375, -6.47509765625, -6.091796875, -5.70849609375, -5.3251953125, -4.94189453125, -4.55859375, -4.17529296875, -3.7919921875, -3.40869140625, -3.025390625, -2.64208984375, -2.2587890625, -1.87548828125, -1.4921875, -1.10888671875, -0.7255859375, -0.34228515625, 0.041015625, 0.42431640625, 0.8076171875, 1.19091796875, 1.57421875, 1.95751953125, 2.3408203125, 2.72412109375, 3.107421875, 3.49072265625, 3.8740234375, 4.25732421875, 4.640625, 5.02392578125, 5.4072265625, 5.79052734375, 6.173828125, 6.55712890625, 6.9404296875, 7.32373046875, 7.70703125, 8.09033203125, 8.4736328125, 8.85693359375, 9.240234375, 9.62353515625, 10.0068359375, 10.39013671875, 10.7734375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 7.0, 6.0, 11.0, 17.0, 11.0, 22.0, 43.0, 44.0, 66.0, 77.0, 125.0, 174.0, 263.0, 347.0, 482.0, 663.0, 914.0, 1477.0, 2147.0, 3512.0, 6800.0, 22201.0, 189220.0, 712670.0, 79553.0, 13432.0, 5278.0, 2910.0, 1875.0, 1243.0, 860.0, 599.0, 404.0, 341.0, 197.0, 145.0, 128.0, 82.0, 50.0, 37.0, 32.0, 30.0, 17.0, 9.0, 11.0, 10.0, 7.0, 5.0, 2.0, 0.0, 3.0, 1.0], "bins": [-12.9453125, -12.578857421875, -12.21240234375, -11.845947265625, -11.4794921875, -11.113037109375, -10.74658203125, -10.380126953125, -10.013671875, -9.647216796875, -9.28076171875, -8.914306640625, -8.5478515625, -8.181396484375, -7.81494140625, -7.448486328125, -7.08203125, -6.715576171875, -6.34912109375, -5.982666015625, -5.6162109375, -5.249755859375, -4.88330078125, -4.516845703125, -4.150390625, -3.783935546875, -3.41748046875, -3.051025390625, -2.6845703125, -2.318115234375, -1.95166015625, -1.585205078125, -1.21875, -0.852294921875, -0.48583984375, -0.119384765625, 0.2470703125, 0.613525390625, 0.97998046875, 1.346435546875, 1.712890625, 2.079345703125, 2.44580078125, 2.812255859375, 3.1787109375, 3.545166015625, 3.91162109375, 4.278076171875, 4.64453125, 5.010986328125, 5.37744140625, 5.743896484375, 6.1103515625, 6.476806640625, 6.84326171875, 7.209716796875, 7.576171875, 7.942626953125, 8.30908203125, 8.675537109375, 9.0419921875, 9.408447265625, 9.77490234375, 10.141357421875, 10.5078125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 4.0, 3.0, 3.0, 3.0, 9.0, 9.0, 17.0, 16.0, 11.0, 14.0, 22.0, 29.0, 40.0, 39.0, 36.0, 52.0, 51.0, 56.0, 34.0, 87.0, 1745.0, 293.0, 58.0, 48.0, 42.0, 44.0, 46.0, 36.0, 19.0, 32.0, 16.0, 27.0, 23.0, 23.0, 15.0, 8.0, 3.0, 3.0, 5.0, 9.0, 7.0, 6.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-40.75, -39.509765625, -38.26953125, -37.029296875, -35.7890625, -34.548828125, -33.30859375, -32.068359375, -30.828125, -29.587890625, -28.34765625, -27.107421875, -25.8671875, -24.626953125, -23.38671875, -22.146484375, -20.90625, -19.666015625, -18.42578125, -17.185546875, -15.9453125, -14.705078125, -13.46484375, -12.224609375, -10.984375, -9.744140625, -8.50390625, -7.263671875, -6.0234375, -4.783203125, -3.54296875, -2.302734375, -1.0625, 0.177734375, 1.41796875, 2.658203125, 3.8984375, 5.138671875, 6.37890625, 7.619140625, 8.859375, 10.099609375, 11.33984375, 12.580078125, 13.8203125, 15.060546875, 16.30078125, 17.541015625, 18.78125, 20.021484375, 21.26171875, 22.501953125, 23.7421875, 24.982421875, 26.22265625, 27.462890625, 28.703125, 29.943359375, 31.18359375, 32.423828125, 33.6640625, 34.904296875, 36.14453125, 37.384765625, 38.625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 1.0, 14.0, 17.0, 9.0, 17.0, 32.0, 51.0, 72.0, 113.0, 163.0, 469.0, 1990.0, 27793.0, 3105917.0, 7289.0, 1017.0, 287.0, 155.0, 91.0, 53.0, 42.0, 33.0, 20.0, 8.0, 10.0, 5.0, 9.0, 2.0, 1.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-123.625, -119.673828125, -115.72265625, -111.771484375, -107.8203125, -103.869140625, -99.91796875, -95.966796875, -92.015625, -88.064453125, -84.11328125, -80.162109375, -76.2109375, -72.259765625, -68.30859375, -64.357421875, -60.40625, -56.455078125, -52.50390625, -48.552734375, -44.6015625, -40.650390625, -36.69921875, -32.748046875, -28.796875, -24.845703125, -20.89453125, -16.943359375, -12.9921875, -9.041015625, -5.08984375, -1.138671875, 2.8125, 6.763671875, 10.71484375, 14.666015625, 18.6171875, 22.568359375, 26.51953125, 30.470703125, 34.421875, 38.373046875, 42.32421875, 46.275390625, 50.2265625, 54.177734375, 58.12890625, 62.080078125, 66.03125, 69.982421875, 73.93359375, 77.884765625, 81.8359375, 85.787109375, 89.73828125, 93.689453125, 97.640625, 101.591796875, 105.54296875, 109.494140625, 113.4453125, 117.396484375, 121.34765625, 125.298828125, 129.25]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 41.0, 802.0, 174.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-533.0867919921875, -522.7637329101562, -512.4407348632812, -502.11767578125, -491.7946472167969, -481.47161865234375, -471.1485595703125, -460.8255310058594, -450.50250244140625, -440.1794738769531, -429.8564453125, -419.53338623046875, -409.2103576660156, -398.8873291015625, -388.56427001953125, -378.2412414550781, -367.918212890625, -357.5951843261719, -347.27215576171875, -336.9490966796875, -326.6260681152344, -316.30303955078125, -305.97998046875, -295.6569519042969, -285.33392333984375, -275.0108947753906, -264.6878662109375, -254.36480712890625, -244.04177856445312, -233.71875, -223.3957061767578, -213.07266235351562, -202.7496337890625, -192.42660522460938, -182.1035614013672, -171.780517578125, -161.45748901367188, -151.13446044921875, -140.81141662597656, -130.48837280273438, -120.16533660888672, -109.84230041503906, -99.5192642211914, -89.19622802734375, -78.8731918334961, -68.55015563964844, -58.22711944580078, -47.904083251953125, -37.58104705810547, -27.258010864257812, -16.934974670410156, -6.6119384765625, 3.7110977172851562, 14.034133911132812, 24.35717010498047, 34.680206298828125, 45.00324249267578, 55.32627868652344, 65.6493148803711, 75.97235107421875, 86.2953872680664, 96.61842346191406, 106.94145965576172, 117.26449584960938, 127.58753204345703]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 10.0, 6.0, 7.0, 6.0, 6.0, 8.0, 11.0, 10.0, 19.0, 21.0, 13.0, 25.0, 32.0, 41.0, 26.0, 47.0, 40.0, 38.0, 36.0, 38.0, 44.0, 50.0, 37.0, 28.0, 43.0, 43.0, 34.0, 48.0, 25.0, 23.0, 30.0, 31.0, 24.0, 21.0, 22.0, 8.0, 16.0, 11.0, 11.0, 5.0, 10.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.37841796875, -103.84265899658203, -100.30690002441406, -96.77114868164062, -93.23538970947266, -89.69963073730469, -86.16387176513672, -82.62811279296875, -79.09236145019531, -75.55660247802734, -72.02084350585938, -68.48509216308594, -64.94933319091797, -61.41357421875, -57.87781524658203, -54.34205627441406, -50.806297302246094, -47.270538330078125, -43.73478317260742, -40.19902420043945, -36.66326904296875, -33.12751007080078, -29.591751098632812, -26.055994033813477, -22.52023696899414, -18.984479904174805, -15.448721885681152, -11.9129638671875, -8.377206802368164, -4.841449737548828, -1.3056907653808594, 2.2300662994384766, 5.765815734863281, 9.301572799682617, 12.83733081817627, 16.373088836669922, 19.908845901489258, 23.444602966308594, 26.980361938476562, 30.5161190032959, 34.051876068115234, 37.5876350402832, 41.123390197753906, 44.659149169921875, 48.194908142089844, 51.73066329956055, 55.266422271728516, 58.80217742919922, 62.33793640136719, 65.87369537353516, 69.40945434570312, 72.94520568847656, 76.48096466064453, 80.0167236328125, 83.55248260498047, 87.08824157714844, 90.62399291992188, 94.15975189208984, 97.69551086425781, 101.23126220703125, 104.76702117919922, 108.30278015136719, 111.83853912353516, 115.37429809570312, 118.9100570678711]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 7.0, 2.0, 7.0, 5.0, 5.0, 8.0, 4.0, 13.0, 12.0, 17.0, 22.0, 21.0, 26.0, 18.0, 23.0, 24.0, 33.0, 45.0, 37.0, 45.0, 39.0, 40.0, 38.0, 43.0, 46.0, 37.0, 43.0, 28.0, 28.0, 37.0, 35.0, 31.0, 33.0, 26.0, 19.0, 16.0, 17.0, 14.0, 15.0, 7.0, 6.0, 6.0, 9.0, 5.0, 5.0, 2.0, 4.0, 6.0, 3.0, 1.0], "bins": [-13.9296875, -13.5552978515625, -13.180908203125, -12.8065185546875, -12.43212890625, -12.0577392578125, -11.683349609375, -11.3089599609375, -10.9345703125, -10.5601806640625, -10.185791015625, -9.8114013671875, -9.43701171875, -9.0626220703125, -8.688232421875, -8.3138427734375, -7.939453125, -7.5650634765625, -7.190673828125, -6.8162841796875, -6.44189453125, -6.0675048828125, -5.693115234375, -5.3187255859375, -4.9443359375, -4.5699462890625, -4.195556640625, -3.8211669921875, -3.44677734375, -3.0723876953125, -2.697998046875, -2.3236083984375, -1.94921875, -1.5748291015625, -1.200439453125, -0.8260498046875, -0.45166015625, -0.0772705078125, 0.297119140625, 0.6715087890625, 1.0458984375, 1.4202880859375, 1.794677734375, 2.1690673828125, 2.54345703125, 2.9178466796875, 3.292236328125, 3.6666259765625, 4.041015625, 4.4154052734375, 4.789794921875, 5.1641845703125, 5.53857421875, 5.9129638671875, 6.287353515625, 6.6617431640625, 7.0361328125, 7.4105224609375, 7.784912109375, 8.1593017578125, 8.53369140625, 8.9080810546875, 9.282470703125, 9.6568603515625, 10.03125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 4.0, 12.0, 18.0, 21.0, 29.0, 29.0, 43.0, 56.0, 71.0, 119.0, 134.0, 174.0, 262.0, 366.0, 552.0, 728.0, 1066.0, 1539.0, 2496.0, 4084.0, 7710.0, 30571.0, 200990.0, 1226548.0, 2147122.0, 464149.0, 75397.0, 14702.0, 5603.0, 3217.0, 2031.0, 1320.0, 884.0, 614.0, 446.0, 330.0, 239.0, 176.0, 111.0, 64.0, 75.0, 48.0, 33.0, 20.0, 34.0, 16.0, 9.0, 12.0, 4.0, 4.0, 4.0, 0.0, 1.0], "bins": [-20.953125, -20.3583984375, -19.763671875, -19.1689453125, -18.57421875, -17.9794921875, -17.384765625, -16.7900390625, -16.1953125, -15.6005859375, -15.005859375, -14.4111328125, -13.81640625, -13.2216796875, -12.626953125, -12.0322265625, -11.4375, -10.8427734375, -10.248046875, -9.6533203125, -9.05859375, -8.4638671875, -7.869140625, -7.2744140625, -6.6796875, -6.0849609375, -5.490234375, -4.8955078125, -4.30078125, -3.7060546875, -3.111328125, -2.5166015625, -1.921875, -1.3271484375, -0.732421875, -0.1376953125, 0.45703125, 1.0517578125, 1.646484375, 2.2412109375, 2.8359375, 3.4306640625, 4.025390625, 4.6201171875, 5.21484375, 5.8095703125, 6.404296875, 6.9990234375, 7.59375, 8.1884765625, 8.783203125, 9.3779296875, 9.97265625, 10.5673828125, 11.162109375, 11.7568359375, 12.3515625, 12.9462890625, 13.541015625, 14.1357421875, 14.73046875, 15.3251953125, 15.919921875, 16.5146484375, 17.109375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 7.0, 8.0, 9.0, 14.0, 31.0, 48.0, 84.0, 219.0, 498.0, 932.0, 1070.0, 592.0, 268.0, 111.0, 53.0, 37.0, 25.0, 11.0, 12.0, 10.0, 10.0, 2.0, 2.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.75, -33.3701171875, -31.990234375, -30.6103515625, -29.23046875, -27.8505859375, -26.470703125, -25.0908203125, -23.7109375, -22.3310546875, -20.951171875, -19.5712890625, -18.19140625, -16.8115234375, -15.431640625, -14.0517578125, -12.671875, -11.2919921875, -9.912109375, -8.5322265625, -7.15234375, -5.7724609375, -4.392578125, -3.0126953125, -1.6328125, -0.2529296875, 1.126953125, 2.5068359375, 3.88671875, 5.2666015625, 6.646484375, 8.0263671875, 9.40625, 10.7861328125, 12.166015625, 13.5458984375, 14.92578125, 16.3056640625, 17.685546875, 19.0654296875, 20.4453125, 21.8251953125, 23.205078125, 24.5849609375, 25.96484375, 27.3447265625, 28.724609375, 30.1044921875, 31.484375, 32.8642578125, 34.244140625, 35.6240234375, 37.00390625, 38.3837890625, 39.763671875, 41.1435546875, 42.5234375, 43.9033203125, 45.283203125, 46.6630859375, 48.04296875, 49.4228515625, 50.802734375, 52.1826171875, 53.5625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 8.0, 8.0, 20.0, 23.0, 51.0, 113.0, 154.0, 336.0, 757.0, 1787.0, 4916.0, 17099.0, 166253.0, 3896909.0, 85715.0, 13379.0, 4048.0, 1433.0, 628.0, 285.0, 148.0, 81.0, 52.0, 34.0, 13.0, 8.0, 7.0, 3.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-92.0625, -89.66552734375, -87.2685546875, -84.87158203125, -82.474609375, -80.07763671875, -77.6806640625, -75.28369140625, -72.88671875, -70.48974609375, -68.0927734375, -65.69580078125, -63.298828125, -60.90185546875, -58.5048828125, -56.10791015625, -53.7109375, -51.31396484375, -48.9169921875, -46.52001953125, -44.123046875, -41.72607421875, -39.3291015625, -36.93212890625, -34.53515625, -32.13818359375, -29.7412109375, -27.34423828125, -24.947265625, -22.55029296875, -20.1533203125, -17.75634765625, -15.359375, -12.96240234375, -10.5654296875, -8.16845703125, -5.771484375, -3.37451171875, -0.9775390625, 1.41943359375, 3.81640625, 6.21337890625, 8.6103515625, 11.00732421875, 13.404296875, 15.80126953125, 18.1982421875, 20.59521484375, 22.9921875, 25.38916015625, 27.7861328125, 30.18310546875, 32.580078125, 34.97705078125, 37.3740234375, 39.77099609375, 42.16796875, 44.56494140625, 46.9619140625, 49.35888671875, 51.755859375, 54.15283203125, 56.5498046875, 58.94677734375, 61.34375]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 10.0, 9.0, 7.0, 12.0, 23.0, 26.0, 39.0, 53.0, 101.0, 110.0, 159.0, 126.0, 88.0, 67.0, 54.0, 27.0, 32.0, 14.0, 14.0, 9.0, 9.0, 5.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.91526794433594, -69.05793762207031, -65.20060729980469, -61.34326934814453, -57.485939025878906, -53.62860870361328, -49.77127456665039, -45.9139404296875, -42.056610107421875, -38.19927978515625, -34.34194564819336, -30.4846134185791, -26.627281188964844, -22.769948959350586, -18.912616729736328, -15.05528450012207, -11.197952270507812, -7.340620040893555, -3.483287811279297, 0.37404441833496094, 4.231376647949219, 8.088708877563477, 11.946041107177734, 15.803373336791992, 19.66070556640625, 23.518037796020508, 27.375370025634766, 31.232702255249023, 35.09003448486328, 38.947364807128906, 42.8046989440918, 46.66203308105469, 50.51936340332031, 54.37669372558594, 58.23402786254883, 62.09136199951172, 65.94869232177734, 69.80602264404297, 73.66336059570312, 77.52069091796875, 81.37802124023438, 85.2353515625, 89.09268188476562, 92.95001983642578, 96.8073501586914, 100.66468048095703, 104.52201843261719, 108.37934875488281, 112.23667907714844, 116.09400939941406, 119.95133972167969, 123.80867767333984, 127.66600799560547, 131.52334594726562, 135.38067626953125, 139.23800659179688, 143.0953369140625, 146.95266723632812, 150.80999755859375, 154.66732788085938, 158.524658203125, 162.3820037841797, 166.2393341064453, 170.09666442871094, 173.95399475097656]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 5.0, 2.0, 4.0, 13.0, 7.0, 15.0, 16.0, 18.0, 22.0, 17.0, 25.0, 26.0, 23.0, 15.0, 29.0, 29.0, 32.0, 38.0, 37.0, 35.0, 30.0, 34.0, 36.0, 39.0, 39.0, 36.0, 31.0, 28.0, 25.0, 37.0, 26.0, 25.0, 31.0, 21.0, 15.0, 14.0, 21.0, 15.0, 12.0, 11.0, 15.0, 15.0, 9.0, 4.0, 8.0, 6.0, 4.0, 3.0, 2.0, 4.0, 1.0, 3.0], "bins": [-80.27215576171875, -77.94873809814453, -75.62532806396484, -73.30191040039062, -70.9784927368164, -68.65507507324219, -66.3316650390625, -64.00824737548828, -61.68483352661133, -59.361419677734375, -57.038002014160156, -54.7145881652832, -52.39117431640625, -50.06775665283203, -47.74434280395508, -45.420928955078125, -43.097511291503906, -40.77409744262695, -38.450679779052734, -36.12726593017578, -33.80384826660156, -31.48043441772461, -29.157020568847656, -26.83360481262207, -24.510189056396484, -22.1867733001709, -19.863357543945312, -17.53994369506836, -15.216527938842773, -12.893112182617188, -10.569697380065918, -8.246282577514648, -5.9228668212890625, -3.5994515419006348, -1.276036262512207, 1.0473790168762207, 3.3707942962646484, 5.694210052490234, 8.017624855041504, 10.341039657592773, 12.66445541381836, 14.987871170043945, 17.31128692626953, 19.634700775146484, 21.95811653137207, 24.281532287597656, 26.60494613647461, 28.928361892700195, 31.25177764892578, 33.575191497802734, 35.89860916137695, 38.222023010253906, 40.545440673828125, 42.86885452270508, 45.19226837158203, 47.51568603515625, 49.8390998840332, 52.162513732910156, 54.485931396484375, 56.80934524536133, 59.13275909423828, 61.4561767578125, 63.77959060668945, 66.1030044555664, 68.42642211914062]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 2.0, 5.0, 2.0, 2.0, 13.0, 12.0, 14.0, 9.0, 17.0, 13.0, 18.0, 22.0, 24.0, 27.0, 24.0, 30.0, 27.0, 34.0, 37.0, 44.0, 47.0, 41.0, 38.0, 44.0, 43.0, 42.0, 44.0, 33.0, 33.0, 38.0, 31.0, 21.0, 29.0, 17.0, 22.0, 18.0, 14.0, 12.0, 13.0, 9.0, 9.0, 6.0, 4.0, 3.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-12.8828125, -12.5006103515625, -12.118408203125, -11.7362060546875, -11.35400390625, -10.9718017578125, -10.589599609375, -10.2073974609375, -9.8251953125, -9.4429931640625, -9.060791015625, -8.6785888671875, -8.29638671875, -7.9141845703125, -7.531982421875, -7.1497802734375, -6.767578125, -6.3853759765625, -6.003173828125, -5.6209716796875, -5.23876953125, -4.8565673828125, -4.474365234375, -4.0921630859375, -3.7099609375, -3.3277587890625, -2.945556640625, -2.5633544921875, -2.18115234375, -1.7989501953125, -1.416748046875, -1.0345458984375, -0.65234375, -0.2701416015625, 0.112060546875, 0.4942626953125, 0.87646484375, 1.2586669921875, 1.640869140625, 2.0230712890625, 2.4052734375, 2.7874755859375, 3.169677734375, 3.5518798828125, 3.93408203125, 4.3162841796875, 4.698486328125, 5.0806884765625, 5.462890625, 5.8450927734375, 6.227294921875, 6.6094970703125, 6.99169921875, 7.3739013671875, 7.756103515625, 8.1383056640625, 8.5205078125, 8.9027099609375, 9.284912109375, 9.6671142578125, 10.04931640625, 10.4315185546875, 10.813720703125, 11.1959228515625, 11.578125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 5.0, 2.0, 4.0, 8.0, 12.0, 12.0, 21.0, 32.0, 44.0, 68.0, 86.0, 127.0, 141.0, 209.0, 270.0, 411.0, 584.0, 907.0, 1195.0, 1737.0, 2532.0, 3656.0, 5637.0, 8498.0, 12887.0, 20068.0, 31918.0, 51837.0, 87543.0, 156870.0, 240745.0, 171050.0, 95939.0, 55924.0, 34415.0, 21665.0, 13788.0, 8845.0, 6036.0, 3938.0, 2719.0, 1846.0, 1294.0, 885.0, 613.0, 443.0, 312.0, 219.0, 182.0, 120.0, 68.0, 53.0, 44.0, 31.0, 27.0, 19.0, 12.0, 6.0, 9.0, 2.0, 1.0, 1.0], "bins": [-1.0751953125, -1.0421905517578125, -1.009185791015625, -0.9761810302734375, -0.94317626953125, -0.9101715087890625, -0.877166748046875, -0.8441619873046875, -0.8111572265625, -0.7781524658203125, -0.745147705078125, -0.7121429443359375, -0.67913818359375, -0.6461334228515625, -0.613128662109375, -0.5801239013671875, -0.547119140625, -0.5141143798828125, -0.481109619140625, -0.4481048583984375, -0.41510009765625, -0.3820953369140625, -0.349090576171875, -0.3160858154296875, -0.2830810546875, -0.2500762939453125, -0.217071533203125, -0.1840667724609375, -0.15106201171875, -0.1180572509765625, -0.085052490234375, -0.0520477294921875, -0.01904296875, 0.0139617919921875, 0.046966552734375, 0.0799713134765625, 0.11297607421875, 0.1459808349609375, 0.178985595703125, 0.2119903564453125, 0.2449951171875, 0.2779998779296875, 0.311004638671875, 0.3440093994140625, 0.37701416015625, 0.4100189208984375, 0.443023681640625, 0.4760284423828125, 0.509033203125, 0.5420379638671875, 0.575042724609375, 0.6080474853515625, 0.64105224609375, 0.6740570068359375, 0.707061767578125, 0.7400665283203125, 0.7730712890625, 0.8060760498046875, 0.839080810546875, 0.8720855712890625, 0.90509033203125, 0.9380950927734375, 0.971099853515625, 1.0041046142578125, 1.037109375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 4.0, 2.0, 8.0, 8.0, 12.0, 15.0, 12.0, 17.0, 14.0, 18.0, 26.0, 26.0, 23.0, 29.0, 38.0, 34.0, 42.0, 41.0, 40.0, 38.0, 1069.0, 41.0, 38.0, 58.0, 33.0, 44.0, 31.0, 30.0, 31.0, 34.0, 29.0, 32.0, 14.0, 14.0, 10.0, 12.0, 10.0, 17.0, 5.0, 5.0, 6.0, 5.0, 2.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.5390625, -7.2952880859375, -7.051513671875, -6.8077392578125, -6.56396484375, -6.3201904296875, -6.076416015625, -5.8326416015625, -5.5888671875, -5.3450927734375, -5.101318359375, -4.8575439453125, -4.61376953125, -4.3699951171875, -4.126220703125, -3.8824462890625, -3.638671875, -3.3948974609375, -3.151123046875, -2.9073486328125, -2.66357421875, -2.4197998046875, -2.176025390625, -1.9322509765625, -1.6884765625, -1.4447021484375, -1.200927734375, -0.9571533203125, -0.71337890625, -0.4696044921875, -0.225830078125, 0.0179443359375, 0.26171875, 0.5054931640625, 0.749267578125, 0.9930419921875, 1.23681640625, 1.4805908203125, 1.724365234375, 1.9681396484375, 2.2119140625, 2.4556884765625, 2.699462890625, 2.9432373046875, 3.18701171875, 3.4307861328125, 3.674560546875, 3.9183349609375, 4.162109375, 4.4058837890625, 4.649658203125, 4.8934326171875, 5.13720703125, 5.3809814453125, 5.624755859375, 5.8685302734375, 6.1123046875, 6.3560791015625, 6.599853515625, 6.8436279296875, 7.08740234375, 7.3311767578125, 7.574951171875, 7.8187255859375, 8.0625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 6.0, 10.0, 14.0, 16.0, 29.0, 41.0, 56.0, 87.0, 113.0, 202.0, 303.0, 500.0, 809.0, 1346.0, 2213.0, 4021.0, 7027.0, 12390.0, 22745.0, 42946.0, 86529.0, 197274.0, 1373392.0, 178027.0, 79198.0, 39526.0, 21167.0, 11408.0, 6396.0, 3874.0, 2099.0, 1261.0, 760.0, 455.0, 317.0, 213.0, 129.0, 77.0, 40.0, 38.0, 27.0, 21.0, 8.0, 8.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.34375, -1.3010101318359375, -1.258270263671875, -1.2155303955078125, -1.17279052734375, -1.1300506591796875, -1.087310791015625, -1.0445709228515625, -1.0018310546875, -0.9590911865234375, -0.916351318359375, -0.8736114501953125, -0.83087158203125, -0.7881317138671875, -0.745391845703125, -0.7026519775390625, -0.659912109375, -0.6171722412109375, -0.574432373046875, -0.5316925048828125, -0.48895263671875, -0.4462127685546875, -0.403472900390625, -0.3607330322265625, -0.3179931640625, -0.2752532958984375, -0.232513427734375, -0.1897735595703125, -0.14703369140625, -0.1042938232421875, -0.061553955078125, -0.0188140869140625, 0.02392578125, 0.0666656494140625, 0.109405517578125, 0.1521453857421875, 0.19488525390625, 0.2376251220703125, 0.280364990234375, 0.3231048583984375, 0.3658447265625, 0.4085845947265625, 0.451324462890625, 0.4940643310546875, 0.53680419921875, 0.5795440673828125, 0.622283935546875, 0.6650238037109375, 0.707763671875, 0.7505035400390625, 0.793243408203125, 0.8359832763671875, 0.87872314453125, 0.9214630126953125, 0.964202880859375, 1.0069427490234375, 1.0496826171875, 1.0924224853515625, 1.135162353515625, 1.1779022216796875, 1.22064208984375, 1.2633819580078125, 1.306121826171875, 1.3488616943359375, 1.3916015625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 11.0, 4.0, 6.0, 8.0, 12.0, 12.0, 19.0, 22.0, 20.0, 31.0, 35.0, 44.0, 58.0, 45.0, 60.0, 63.0, 55.0, 55.0, 54.0, 62.0, 44.0, 41.0, 36.0, 36.0, 28.0, 26.0, 29.0, 14.0, 8.0, 11.0, 8.0, 4.0, 5.0, 6.0, 5.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.002986907958984375, -0.002895176410675049, -0.0028034448623657227, -0.0027117133140563965, -0.0026199817657470703, -0.002528250217437744, -0.002436518669128418, -0.002344787120819092, -0.0022530555725097656, -0.0021613240242004395, -0.0020695924758911133, -0.001977860927581787, -0.001886129379272461, -0.0017943978309631348, -0.0017026662826538086, -0.0016109347343444824, -0.0015192031860351562, -0.00142747163772583, -0.001335740089416504, -0.0012440085411071777, -0.0011522769927978516, -0.0010605454444885254, -0.0009688138961791992, -0.000877082347869873, -0.0007853507995605469, -0.0006936192512512207, -0.0006018877029418945, -0.0005101561546325684, -0.0004184246063232422, -0.000326693058013916, -0.00023496150970458984, -0.00014322996139526367, -5.14984130859375e-05, 4.023313522338867e-05, 0.00013196468353271484, 0.00022369623184204102, 0.0003154277801513672, 0.00040715932846069336, 0.0004988908767700195, 0.0005906224250793457, 0.0006823539733886719, 0.000774085521697998, 0.0008658170700073242, 0.0009575486183166504, 0.0010492801666259766, 0.0011410117149353027, 0.001232743263244629, 0.001324474811553955, 0.0014162063598632812, 0.0015079379081726074, 0.0015996694564819336, 0.0016914010047912598, 0.001783132553100586, 0.0018748641014099121, 0.0019665956497192383, 0.0020583271980285645, 0.0021500587463378906, 0.002241790294647217, 0.002333521842956543, 0.002425253391265869, 0.0025169849395751953, 0.0026087164878845215, 0.0027004480361938477, 0.002792179584503174, 0.0028839111328125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 9.0, 2.0, 6.0, 18.0, 23.0, 22.0, 28.0, 49.0, 46.0, 73.0, 108.0, 129.0, 246.0, 550.0, 3632.0, 637510.0, 402033.0, 2798.0, 521.0, 243.0, 132.0, 96.0, 62.0, 47.0, 40.0, 31.0, 19.0, 8.0, 22.0, 13.0, 7.0, 6.0, 2.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.060394287109375, -0.058443546295166016, -0.05649280548095703, -0.05454206466674805, -0.05259132385253906, -0.05064058303833008, -0.048689842224121094, -0.04673910140991211, -0.044788360595703125, -0.04283761978149414, -0.040886878967285156, -0.03893613815307617, -0.03698539733886719, -0.0350346565246582, -0.03308391571044922, -0.031133174896240234, -0.02918243408203125, -0.027231693267822266, -0.02528095245361328, -0.023330211639404297, -0.021379470825195312, -0.019428730010986328, -0.017477989196777344, -0.01552724838256836, -0.013576507568359375, -0.01162576675415039, -0.009675025939941406, -0.007724285125732422, -0.0057735443115234375, -0.003822803497314453, -0.0018720626831054688, 7.867813110351562e-05, 0.0020294189453125, 0.003980159759521484, 0.005930900573730469, 0.007881641387939453, 0.009832382202148438, 0.011783123016357422, 0.013733863830566406, 0.01568460464477539, 0.017635345458984375, 0.01958608627319336, 0.021536827087402344, 0.023487567901611328, 0.025438308715820312, 0.027389049530029297, 0.02933979034423828, 0.031290531158447266, 0.03324127197265625, 0.035192012786865234, 0.03714275360107422, 0.0390934944152832, 0.04104423522949219, 0.04299497604370117, 0.044945716857910156, 0.04689645767211914, 0.048847198486328125, 0.05079793930053711, 0.052748680114746094, 0.05469942092895508, 0.05665016174316406, 0.05860090255737305, 0.06055164337158203, 0.06250238418579102, 0.064453125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 27.0, 179.0, 552.0, 204.0, 42.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005370369181036949, -0.0050246440805494785, -0.004678918980062008, -0.00433319341391325, -0.003987468313425779, -0.0036417432129383087, -0.003296018112450838, -0.002950292779132724, -0.002604567678645253, -0.0022588425781577826, -0.0019131172448396683, -0.0015673921443521976, -0.0012216669274494052, -0.0008759417105466127, -0.0005302166100591421, -0.00018449127674102783, 0.0001612338237464428, 0.0005069590406492352, 0.0008526841993443668, 0.0011984093580394983, 0.0015441345749422908, 0.0018898597918450832, 0.002235584892332554, 0.002581310225650668, 0.0029270353261381388, 0.0032727604266256094, 0.0036184857599437237, 0.003964210860431194, 0.004309935960918665, 0.0046556610614061356, 0.0050013866275548935, 0.005347111728042364, 0.005692836828529835, 0.006038561929017305, 0.006384287029504776, 0.006730012595653534, 0.0070757376961410046, 0.007421462796628475, 0.007767187897115946, 0.008112912997603416, 0.008458638563752174, 0.008804364129900932, 0.009150088764727116, 0.009495814330875874, 0.009841538965702057, 0.010187264531850815, 0.010532990097999573, 0.010878714732825756, 0.01122443936765194, 0.011570164933800697, 0.01191588956862688, 0.012261615134775639, 0.012607339769601822, 0.01295306533575058, 0.013298790901899338, 0.013644515536725521, 0.013990241102874279, 0.014335966669023037, 0.01468169130384922, 0.015027416869997978, 0.015373141504824162, 0.015718866139650345, 0.016064591705799103, 0.01641031727194786, 0.01675604283809662]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 13.0, 6.0, 8.0, 8.0, 10.0, 19.0, 8.0, 18.0, 20.0, 24.0, 29.0, 24.0, 30.0, 41.0, 32.0, 42.0, 41.0, 48.0, 41.0, 43.0, 30.0, 47.0, 43.0, 34.0, 45.0, 27.0, 28.0, 36.0, 30.0, 26.0, 26.0, 21.0, 19.0, 16.0, 16.0, 14.0, 12.0, 9.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0019225478172302246, -0.0018704747781157494, -0.0018184017390012741, -0.0017663286998867989, -0.0017142556607723236, -0.0016621826216578484, -0.001610109582543373, -0.0015580365434288979, -0.0015059635043144226, -0.0014538904651999474, -0.001401817426085472, -0.0013497443869709969, -0.0012976713478565216, -0.0012455983087420464, -0.001193525269627571, -0.0011414522305130959, -0.0010893791913986206, -0.0010373061522841454, -0.00098523311316967, -0.0009331600740551949, -0.0008810870349407196, -0.0008290139958262444, -0.0007769409567117691, -0.0007248679175972939, -0.0006727948784828186, -0.0006207218393683434, -0.0005686488002538681, -0.0005165757611393929, -0.0004645027220249176, -0.00041242968291044235, -0.0003603566437959671, -0.00030828360468149185, -0.0002562105655670166, -0.00020413752645254135, -0.0001520644873380661, -9.999144822359085e-05, -4.79184091091156e-05, 4.15463000535965e-06, 5.62276691198349e-05, 0.00010830070823431015, 0.0001603737473487854, 0.00021244678646326065, 0.0002645198255777359, 0.00031659286469221115, 0.0003686659038066864, 0.00042073894292116165, 0.0004728119820356369, 0.0005248850211501122, 0.0005769580602645874, 0.0006290310993790627, 0.0006811041384935379, 0.0007331771776080132, 0.0007852502167224884, 0.0008373232558369637, 0.0008893962949514389, 0.0009414693340659142, 0.0009935423731803894, 0.0010456154122948647, 0.00109768845140934, 0.0011497614905238152, 0.0012018345296382904, 0.0012539075687527657, 0.001305980607867241, 0.0013580536469817162, 0.0014101266860961914]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 2.0, 5.0, 2.0, 2.0, 13.0, 12.0, 14.0, 9.0, 17.0, 13.0, 18.0, 22.0, 24.0, 27.0, 24.0, 30.0, 27.0, 34.0, 37.0, 44.0, 47.0, 41.0, 38.0, 44.0, 43.0, 42.0, 44.0, 33.0, 33.0, 38.0, 31.0, 21.0, 29.0, 17.0, 22.0, 18.0, 14.0, 12.0, 13.0, 9.0, 9.0, 6.0, 4.0, 3.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-12.8828125, -12.5006103515625, -12.118408203125, -11.7362060546875, -11.35400390625, -10.9718017578125, -10.589599609375, -10.2073974609375, -9.8251953125, -9.4429931640625, -9.060791015625, -8.6785888671875, -8.29638671875, -7.9141845703125, -7.531982421875, -7.1497802734375, -6.767578125, -6.3853759765625, -6.003173828125, -5.6209716796875, -5.23876953125, -4.8565673828125, -4.474365234375, -4.0921630859375, -3.7099609375, -3.3277587890625, -2.945556640625, -2.5633544921875, -2.18115234375, -1.7989501953125, -1.416748046875, -1.0345458984375, -0.65234375, -0.2701416015625, 0.112060546875, 0.4942626953125, 0.87646484375, 1.2586669921875, 1.640869140625, 2.0230712890625, 2.4052734375, 2.7874755859375, 3.169677734375, 3.5518798828125, 3.93408203125, 4.3162841796875, 4.698486328125, 5.0806884765625, 5.462890625, 5.8450927734375, 6.227294921875, 6.6094970703125, 6.99169921875, 7.3739013671875, 7.756103515625, 8.1383056640625, 8.5205078125, 8.9027099609375, 9.284912109375, 9.6671142578125, 10.04931640625, 10.4315185546875, 10.813720703125, 11.1959228515625, 11.578125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 1.0, 0.0, 2.0, 5.0, 2.0, 7.0, 15.0, 9.0, 18.0, 10.0, 24.0, 39.0, 51.0, 71.0, 86.0, 102.0, 160.0, 269.0, 360.0, 542.0, 861.0, 1406.0, 2526.0, 4667.0, 9552.0, 21000.0, 54047.0, 162534.0, 441654.0, 225523.0, 71468.0, 26751.0, 11629.0, 5608.0, 2930.0, 1686.0, 978.0, 616.0, 401.0, 273.0, 193.0, 126.0, 96.0, 74.0, 52.0, 40.0, 29.0, 13.0, 12.0, 14.0, 9.0, 3.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.4375, -7.202392578125, -6.96728515625, -6.732177734375, -6.4970703125, -6.261962890625, -6.02685546875, -5.791748046875, -5.556640625, -5.321533203125, -5.08642578125, -4.851318359375, -4.6162109375, -4.381103515625, -4.14599609375, -3.910888671875, -3.67578125, -3.440673828125, -3.20556640625, -2.970458984375, -2.7353515625, -2.500244140625, -2.26513671875, -2.030029296875, -1.794921875, -1.559814453125, -1.32470703125, -1.089599609375, -0.8544921875, -0.619384765625, -0.38427734375, -0.149169921875, 0.0859375, 0.321044921875, 0.55615234375, 0.791259765625, 1.0263671875, 1.261474609375, 1.49658203125, 1.731689453125, 1.966796875, 2.201904296875, 2.43701171875, 2.672119140625, 2.9072265625, 3.142333984375, 3.37744140625, 3.612548828125, 3.84765625, 4.082763671875, 4.31787109375, 4.552978515625, 4.7880859375, 5.023193359375, 5.25830078125, 5.493408203125, 5.728515625, 5.963623046875, 6.19873046875, 6.433837890625, 6.6689453125, 6.904052734375, 7.13916015625, 7.374267578125, 7.609375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 4.0, 3.0, 11.0, 7.0, 16.0, 15.0, 12.0, 13.0, 26.0, 23.0, 33.0, 42.0, 35.0, 46.0, 48.0, 57.0, 87.0, 404.0, 1638.0, 85.0, 49.0, 52.0, 42.0, 35.0, 54.0, 33.0, 28.0, 23.0, 27.0, 19.0, 15.0, 15.0, 11.0, 14.0, 4.0, 9.0, 3.0, 2.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-44.875, -43.3828125, -41.890625, -40.3984375, -38.90625, -37.4140625, -35.921875, -34.4296875, -32.9375, -31.4453125, -29.953125, -28.4609375, -26.96875, -25.4765625, -23.984375, -22.4921875, -21.0, -19.5078125, -18.015625, -16.5234375, -15.03125, -13.5390625, -12.046875, -10.5546875, -9.0625, -7.5703125, -6.078125, -4.5859375, -3.09375, -1.6015625, -0.109375, 1.3828125, 2.875, 4.3671875, 5.859375, 7.3515625, 8.84375, 10.3359375, 11.828125, 13.3203125, 14.8125, 16.3046875, 17.796875, 19.2890625, 20.78125, 22.2734375, 23.765625, 25.2578125, 26.75, 28.2421875, 29.734375, 31.2265625, 32.71875, 34.2109375, 35.703125, 37.1953125, 38.6875, 40.1796875, 41.671875, 43.1640625, 44.65625, 46.1484375, 47.640625, 49.1328125, 50.625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 3.0, 12.0, 7.0, 14.0, 13.0, 16.0, 18.0, 33.0, 43.0, 44.0, 70.0, 85.0, 109.0, 132.0, 204.0, 301.0, 571.0, 2844.0, 3075266.0, 63349.0, 1245.0, 450.0, 240.0, 169.0, 123.0, 91.0, 62.0, 42.0, 44.0, 20.0, 16.0, 16.0, 14.0, 14.0, 7.0, 3.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.875, -111.4765625, -108.078125, -104.6796875, -101.28125, -97.8828125, -94.484375, -91.0859375, -87.6875, -84.2890625, -80.890625, -77.4921875, -74.09375, -70.6953125, -67.296875, -63.8984375, -60.5, -57.1015625, -53.703125, -50.3046875, -46.90625, -43.5078125, -40.109375, -36.7109375, -33.3125, -29.9140625, -26.515625, -23.1171875, -19.71875, -16.3203125, -12.921875, -9.5234375, -6.125, -2.7265625, 0.671875, 4.0703125, 7.46875, 10.8671875, 14.265625, 17.6640625, 21.0625, 24.4609375, 27.859375, 31.2578125, 34.65625, 38.0546875, 41.453125, 44.8515625, 48.25, 51.6484375, 55.046875, 58.4453125, 61.84375, 65.2421875, 68.640625, 72.0390625, 75.4375, 78.8359375, 82.234375, 85.6328125, 89.03125, 92.4296875, 95.828125, 99.2265625, 102.625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 173.0, 764.0, 74.0, 3.0], "bins": [-425.7110290527344, -418.7750244140625, -411.8389892578125, -404.9029846191406, -397.96697998046875, -391.03094482421875, -384.0949401855469, -377.158935546875, -370.222900390625, -363.2868957519531, -356.3508605957031, -349.41485595703125, -342.4788513183594, -335.5428161621094, -328.6068115234375, -321.6708068847656, -314.73480224609375, -307.7987976074219, -300.8627624511719, -293.9267578125, -286.9907531738281, -280.0547180175781, -273.11871337890625, -266.1827087402344, -259.2466735839844, -252.31065368652344, -245.37464904785156, -238.43862915039062, -231.5026092529297, -224.5666046142578, -217.63058471679688, -210.694580078125, -203.75857543945312, -196.8225555419922, -189.8865509033203, -182.95053100585938, -176.01451110839844, -169.07850646972656, -162.14248657226562, -155.20648193359375, -148.27044677734375, -141.3344268798828, -134.39842224121094, -127.46240234375, -120.5263900756836, -113.59037780761719, -106.65435791015625, -99.71834564208984, -92.78233337402344, -85.84632110595703, -78.9103012084961, -71.97428894042969, -65.03827667236328, -58.10226058959961, -51.16624450683594, -44.23023223876953, -37.29421615600586, -30.35820198059082, -23.42218780517578, -16.48617172241211, -9.55015754699707, -2.6141433715820312, 4.321872711181641, 11.257884979248047, 18.19390106201172]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 3.0, 3.0, 8.0, 9.0, 12.0, 10.0, 16.0, 18.0, 19.0, 22.0, 19.0, 22.0, 28.0, 39.0, 43.0, 29.0, 33.0, 44.0, 49.0, 44.0, 37.0, 46.0, 30.0, 40.0, 36.0, 41.0, 38.0, 32.0, 29.0, 30.0, 19.0, 27.0, 23.0, 24.0, 19.0, 14.0, 12.0, 3.0, 7.0, 11.0, 1.0, 4.0, 4.0, 2.0, 1.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.50714111328125, -104.33348083496094, -101.15982055664062, -97.98616027832031, -94.8125, -91.63883209228516, -88.46517181396484, -85.29151153564453, -82.11785125732422, -78.9441909790039, -75.7705307006836, -72.59687042236328, -69.42320251464844, -66.24954223632812, -63.07588195800781, -59.9022216796875, -56.72856140136719, -53.554901123046875, -50.38124084472656, -47.207576751708984, -44.03391647338867, -40.86025619506836, -37.68659210205078, -34.51293182373047, -31.339271545410156, -28.165611267089844, -24.9919490814209, -21.818286895751953, -18.64462661743164, -15.470965385437012, -12.297304153442383, -9.123641967773438, -5.949981689453125, -2.776320457458496, 0.3973407745361328, 3.5710020065307617, 6.744663238525391, 9.91832447052002, 13.091985702514648, 16.265647888183594, 19.439308166503906, 22.61296844482422, 25.786630630493164, 28.96029281616211, 32.13395309448242, 35.307613372802734, 38.48127746582031, 41.654937744140625, 44.82859802246094, 48.00225830078125, 51.17591857910156, 54.34958267211914, 57.52324295043945, 60.696903228759766, 63.870567321777344, 67.04422760009766, 70.21788787841797, 73.39154815673828, 76.5652084350586, 79.7388687133789, 82.91253662109375, 86.08619689941406, 89.25985717773438, 92.43351745605469, 95.607177734375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 4.0, 4.0, 1.0, 7.0, 11.0, 12.0, 12.0, 16.0, 15.0, 17.0, 20.0, 23.0, 28.0, 27.0, 21.0, 43.0, 32.0, 36.0, 29.0, 45.0, 44.0, 46.0, 50.0, 41.0, 39.0, 39.0, 38.0, 40.0, 37.0, 33.0, 28.0, 26.0, 16.0, 18.0, 17.0, 22.0, 8.0, 12.0, 12.0, 11.0, 3.0, 1.0, 9.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-13.2265625, -12.82568359375, -12.4248046875, -12.02392578125, -11.623046875, -11.22216796875, -10.8212890625, -10.42041015625, -10.01953125, -9.61865234375, -9.2177734375, -8.81689453125, -8.416015625, -8.01513671875, -7.6142578125, -7.21337890625, -6.8125, -6.41162109375, -6.0107421875, -5.60986328125, -5.208984375, -4.80810546875, -4.4072265625, -4.00634765625, -3.60546875, -3.20458984375, -2.8037109375, -2.40283203125, -2.001953125, -1.60107421875, -1.2001953125, -0.79931640625, -0.3984375, 0.00244140625, 0.4033203125, 0.80419921875, 1.205078125, 1.60595703125, 2.0068359375, 2.40771484375, 2.80859375, 3.20947265625, 3.6103515625, 4.01123046875, 4.412109375, 4.81298828125, 5.2138671875, 5.61474609375, 6.015625, 6.41650390625, 6.8173828125, 7.21826171875, 7.619140625, 8.02001953125, 8.4208984375, 8.82177734375, 9.22265625, 9.62353515625, 10.0244140625, 10.42529296875, 10.826171875, 11.22705078125, 11.6279296875, 12.02880859375, 12.4296875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 5.0, 2.0, 5.0, 2.0, 17.0, 15.0, 7.0, 11.0, 19.0, 16.0, 22.0, 35.0, 46.0, 52.0, 70.0, 136.0, 303.0, 562.0, 1447.0, 4315.0, 27962.0, 3086900.0, 1054120.0, 12715.0, 3145.0, 1188.0, 484.0, 230.0, 132.0, 86.0, 54.0, 36.0, 17.0, 23.0, 17.0, 15.0, 9.0, 14.0, 10.0, 8.0, 8.0, 4.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0], "bins": [-60.84375, -58.9921875, -57.140625, -55.2890625, -53.4375, -51.5859375, -49.734375, -47.8828125, -46.03125, -44.1796875, -42.328125, -40.4765625, -38.625, -36.7734375, -34.921875, -33.0703125, -31.21875, -29.3671875, -27.515625, -25.6640625, -23.8125, -21.9609375, -20.109375, -18.2578125, -16.40625, -14.5546875, -12.703125, -10.8515625, -9.0, -7.1484375, -5.296875, -3.4453125, -1.59375, 0.2578125, 2.109375, 3.9609375, 5.8125, 7.6640625, 9.515625, 11.3671875, 13.21875, 15.0703125, 16.921875, 18.7734375, 20.625, 22.4765625, 24.328125, 26.1796875, 28.03125, 29.8828125, 31.734375, 33.5859375, 35.4375, 37.2890625, 39.140625, 40.9921875, 42.84375, 44.6953125, 46.546875, 48.3984375, 50.25, 52.1015625, 53.953125, 55.8046875, 57.65625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 3.0, 7.0, 8.0, 16.0, 27.0, 32.0, 61.0, 149.0, 381.0, 944.0, 1213.0, 709.0, 271.0, 112.0, 59.0, 22.0, 22.0, 12.0, 12.0, 2.0, 5.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.59375, -37.07080078125, -35.5478515625, -34.02490234375, -32.501953125, -30.97900390625, -29.4560546875, -27.93310546875, -26.41015625, -24.88720703125, -23.3642578125, -21.84130859375, -20.318359375, -18.79541015625, -17.2724609375, -15.74951171875, -14.2265625, -12.70361328125, -11.1806640625, -9.65771484375, -8.134765625, -6.61181640625, -5.0888671875, -3.56591796875, -2.04296875, -0.52001953125, 1.0029296875, 2.52587890625, 4.048828125, 5.57177734375, 7.0947265625, 8.61767578125, 10.140625, 11.66357421875, 13.1865234375, 14.70947265625, 16.232421875, 17.75537109375, 19.2783203125, 20.80126953125, 22.32421875, 23.84716796875, 25.3701171875, 26.89306640625, 28.416015625, 29.93896484375, 31.4619140625, 32.98486328125, 34.5078125, 36.03076171875, 37.5537109375, 39.07666015625, 40.599609375, 42.12255859375, 43.6455078125, 45.16845703125, 46.69140625, 48.21435546875, 49.7373046875, 51.26025390625, 52.783203125, 54.30615234375, 55.8291015625, 57.35205078125, 58.875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 9.0, 12.0, 38.0, 45.0, 110.0, 201.0, 495.0, 1637.0, 7748.0, 92551.0, 4031818.0, 51588.0, 5833.0, 1360.0, 434.0, 187.0, 88.0, 53.0, 29.0, 21.0, 7.0, 7.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-124.1875, -120.955078125, -117.72265625, -114.490234375, -111.2578125, -108.025390625, -104.79296875, -101.560546875, -98.328125, -95.095703125, -91.86328125, -88.630859375, -85.3984375, -82.166015625, -78.93359375, -75.701171875, -72.46875, -69.236328125, -66.00390625, -62.771484375, -59.5390625, -56.306640625, -53.07421875, -49.841796875, -46.609375, -43.376953125, -40.14453125, -36.912109375, -33.6796875, -30.447265625, -27.21484375, -23.982421875, -20.75, -17.517578125, -14.28515625, -11.052734375, -7.8203125, -4.587890625, -1.35546875, 1.876953125, 5.109375, 8.341796875, 11.57421875, 14.806640625, 18.0390625, 21.271484375, 24.50390625, 27.736328125, 30.96875, 34.201171875, 37.43359375, 40.666015625, 43.8984375, 47.130859375, 50.36328125, 53.595703125, 56.828125, 60.060546875, 63.29296875, 66.525390625, 69.7578125, 72.990234375, 76.22265625, 79.455078125, 82.6875]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 6.0, 7.0, 8.0, 14.0, 26.0, 43.0, 71.0, 128.0, 189.0, 206.0, 134.0, 69.0, 49.0, 24.0, 14.0, 8.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-174.26254272460938, -169.29737854003906, -164.3321990966797, -159.36703491210938, -154.40187072753906, -149.4366912841797, -144.47152709960938, -139.50634765625, -134.5411834716797, -129.57601928710938, -124.61084747314453, -119.64567565917969, -114.68050384521484, -109.71533203125, -104.75016784667969, -99.78499603271484, -94.81983184814453, -89.85466003417969, -84.88949584960938, -79.92432403564453, -74.95915222167969, -69.99398803710938, -65.02881622314453, -60.06364440917969, -55.09847640991211, -50.13330841064453, -45.16813659667969, -40.20296859741211, -35.23780059814453, -30.272628784179688, -25.30746078491211, -20.342288970947266, -15.377120971679688, -10.411951065063477, -5.446782112121582, -0.4816131591796875, 4.483556747436523, 9.448726654052734, 14.413894653320312, 19.379066467285156, 24.344234466552734, 29.309404373168945, 34.274574279785156, 39.239742279052734, 44.20491027832031, 49.170082092285156, 54.135250091552734, 59.10042190551758, 64.06558990478516, 69.03076171875, 73.99592590332031, 78.96109771728516, 83.92626953125, 88.89143371582031, 93.85660552978516, 98.82177734375, 103.78694152832031, 108.75211334228516, 113.71727752685547, 118.68244934082031, 123.64762115478516, 128.61279296875, 133.5779571533203, 138.54312133789062, 143.50830078125]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 7.0, 3.0, 3.0, 6.0, 6.0, 22.0, 10.0, 15.0, 15.0, 15.0, 24.0, 24.0, 35.0, 25.0, 27.0, 39.0, 32.0, 33.0, 35.0, 42.0, 44.0, 38.0, 28.0, 40.0, 34.0, 45.0, 33.0, 40.0, 38.0, 31.0, 24.0, 22.0, 22.0, 23.0, 17.0, 21.0, 13.0, 13.0, 13.0, 12.0, 7.0, 4.0, 2.0, 4.0, 3.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-72.51066589355469, -70.24317169189453, -67.97567749023438, -65.70818328857422, -63.44068908691406, -61.173194885253906, -58.90570068359375, -56.638206481933594, -54.37071228027344, -52.10321807861328, -49.835723876953125, -47.56822967529297, -45.30073547363281, -43.033241271972656, -40.7657470703125, -38.498252868652344, -36.23075866699219, -33.96326446533203, -31.695770263671875, -29.42827606201172, -27.160781860351562, -24.893287658691406, -22.62579345703125, -20.358299255371094, -18.090805053710938, -15.823310852050781, -13.555816650390625, -11.288322448730469, -9.020828247070312, -6.753334045410156, -4.48583984375, -2.2183456420898438, 0.0491485595703125, 2.3166427612304688, 4.584136962890625, 6.851631164550781, 9.119125366210938, 11.386619567871094, 13.65411376953125, 15.921607971191406, 18.189102172851562, 20.45659637451172, 22.724090576171875, 24.99158477783203, 27.259078979492188, 29.526573181152344, 31.7940673828125, 34.061561584472656, 36.32905578613281, 38.59654998779297, 40.864044189453125, 43.13153839111328, 45.39903259277344, 47.666526794433594, 49.93402099609375, 52.201515197753906, 54.46900939941406, 56.73650360107422, 59.003997802734375, 61.27149200439453, 63.53898620605469, 65.80648040771484, 68.073974609375, 70.34146881103516, 72.60896301269531]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 6.0, 9.0, 12.0, 10.0, 14.0, 19.0, 19.0, 29.0, 25.0, 22.0, 31.0, 35.0, 33.0, 40.0, 48.0, 29.0, 45.0, 51.0, 40.0, 42.0, 48.0, 31.0, 41.0, 57.0, 36.0, 25.0, 29.0, 12.0, 22.0, 16.0, 19.0, 20.0, 18.0, 15.0, 7.0, 11.0, 6.0, 8.0, 4.0, 1.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.1484375, -13.7249755859375, -13.301513671875, -12.8780517578125, -12.45458984375, -12.0311279296875, -11.607666015625, -11.1842041015625, -10.7607421875, -10.3372802734375, -9.913818359375, -9.4903564453125, -9.06689453125, -8.6434326171875, -8.219970703125, -7.7965087890625, -7.373046875, -6.9495849609375, -6.526123046875, -6.1026611328125, -5.67919921875, -5.2557373046875, -4.832275390625, -4.4088134765625, -3.9853515625, -3.5618896484375, -3.138427734375, -2.7149658203125, -2.29150390625, -1.8680419921875, -1.444580078125, -1.0211181640625, -0.59765625, -0.1741943359375, 0.249267578125, 0.6727294921875, 1.09619140625, 1.5196533203125, 1.943115234375, 2.3665771484375, 2.7900390625, 3.2135009765625, 3.636962890625, 4.0604248046875, 4.48388671875, 4.9073486328125, 5.330810546875, 5.7542724609375, 6.177734375, 6.6011962890625, 7.024658203125, 7.4481201171875, 7.87158203125, 8.2950439453125, 8.718505859375, 9.1419677734375, 9.5654296875, 9.9888916015625, 10.412353515625, 10.8358154296875, 11.25927734375, 11.6827392578125, 12.106201171875, 12.5296630859375, 12.953125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 3.0, 1.0, 3.0, 8.0, 10.0, 17.0, 21.0, 22.0, 29.0, 49.0, 68.0, 95.0, 126.0, 195.0, 264.0, 401.0, 550.0, 810.0, 1163.0, 1717.0, 2488.0, 3740.0, 5754.0, 8862.0, 14066.0, 22635.0, 37258.0, 63625.0, 116540.0, 216999.0, 239242.0, 130992.0, 71069.0, 40922.0, 24621.0, 15401.0, 9706.0, 6426.0, 4154.0, 2683.0, 1800.0, 1250.0, 807.0, 608.0, 397.0, 265.0, 206.0, 159.0, 100.0, 55.0, 51.0, 33.0, 28.0, 20.0, 16.0, 15.0, 8.0, 5.0, 1.0, 4.0, 1.0, 5.0], "bins": [-1.1611328125, -1.1249542236328125, -1.088775634765625, -1.0525970458984375, -1.01641845703125, -0.9802398681640625, -0.944061279296875, -0.9078826904296875, -0.8717041015625, -0.8355255126953125, -0.799346923828125, -0.7631683349609375, -0.72698974609375, -0.6908111572265625, -0.654632568359375, -0.6184539794921875, -0.582275390625, -0.5460968017578125, -0.509918212890625, -0.4737396240234375, -0.43756103515625, -0.4013824462890625, -0.365203857421875, -0.3290252685546875, -0.2928466796875, -0.2566680908203125, -0.220489501953125, -0.1843109130859375, -0.14813232421875, -0.1119537353515625, -0.075775146484375, -0.0395965576171875, -0.00341796875, 0.0327606201171875, 0.068939208984375, 0.1051177978515625, 0.14129638671875, 0.1774749755859375, 0.213653564453125, 0.2498321533203125, 0.2860107421875, 0.3221893310546875, 0.358367919921875, 0.3945465087890625, 0.43072509765625, 0.4669036865234375, 0.503082275390625, 0.5392608642578125, 0.575439453125, 0.6116180419921875, 0.647796630859375, 0.6839752197265625, 0.72015380859375, 0.7563323974609375, 0.792510986328125, 0.8286895751953125, 0.8648681640625, 0.9010467529296875, 0.937225341796875, 0.9734039306640625, 1.00958251953125, 1.0457611083984375, 1.081939697265625, 1.1181182861328125, 1.154296875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 4.0, 6.0, 2.0, 10.0, 5.0, 9.0, 14.0, 13.0, 15.0, 10.0, 17.0, 19.0, 19.0, 28.0, 28.0, 27.0, 30.0, 35.0, 43.0, 35.0, 33.0, 35.0, 28.0, 1066.0, 31.0, 26.0, 44.0, 34.0, 42.0, 37.0, 24.0, 31.0, 38.0, 34.0, 27.0, 16.0, 24.0, 17.0, 21.0, 5.0, 9.0, 4.0, 7.0, 2.0, 4.0, 4.0, 7.0, 4.0, 5.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0], "bins": [-8.34375, -8.08917236328125, -7.8345947265625, -7.58001708984375, -7.325439453125, -7.07086181640625, -6.8162841796875, -6.56170654296875, -6.30712890625, -6.05255126953125, -5.7979736328125, -5.54339599609375, -5.288818359375, -5.03424072265625, -4.7796630859375, -4.52508544921875, -4.2705078125, -4.01593017578125, -3.7613525390625, -3.50677490234375, -3.252197265625, -2.99761962890625, -2.7430419921875, -2.48846435546875, -2.23388671875, -1.97930908203125, -1.7247314453125, -1.47015380859375, -1.215576171875, -0.96099853515625, -0.7064208984375, -0.45184326171875, -0.197265625, 0.05731201171875, 0.3118896484375, 0.56646728515625, 0.821044921875, 1.07562255859375, 1.3302001953125, 1.58477783203125, 1.83935546875, 2.09393310546875, 2.3485107421875, 2.60308837890625, 2.857666015625, 3.11224365234375, 3.3668212890625, 3.62139892578125, 3.8759765625, 4.13055419921875, 4.3851318359375, 4.63970947265625, 4.894287109375, 5.14886474609375, 5.4034423828125, 5.65802001953125, 5.91259765625, 6.16717529296875, 6.4217529296875, 6.67633056640625, 6.930908203125, 7.18548583984375, 7.4400634765625, 7.69464111328125, 7.94921875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 6.0, 7.0, 6.0, 9.0, 14.0, 25.0, 36.0, 45.0, 52.0, 90.0, 140.0, 200.0, 297.0, 473.0, 808.0, 1161.0, 1864.0, 2853.0, 4739.0, 7911.0, 13090.0, 22290.0, 39203.0, 72424.0, 142201.0, 1319027.0, 223345.0, 109132.0, 57331.0, 31888.0, 18316.0, 10786.0, 6595.0, 3867.0, 2543.0, 1521.0, 973.0, 633.0, 426.0, 270.0, 176.0, 115.0, 74.0, 50.0, 42.0, 25.0, 17.0, 16.0, 8.0, 9.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.3330078125, -1.291107177734375, -1.24920654296875, -1.207305908203125, -1.1654052734375, -1.123504638671875, -1.08160400390625, -1.039703369140625, -0.997802734375, -0.955902099609375, -0.91400146484375, -0.872100830078125, -0.8302001953125, -0.788299560546875, -0.74639892578125, -0.704498291015625, -0.66259765625, -0.620697021484375, -0.57879638671875, -0.536895751953125, -0.4949951171875, -0.453094482421875, -0.41119384765625, -0.369293212890625, -0.327392578125, -0.285491943359375, -0.24359130859375, -0.201690673828125, -0.1597900390625, -0.117889404296875, -0.07598876953125, -0.034088134765625, 0.0078125, 0.049713134765625, 0.09161376953125, 0.133514404296875, 0.1754150390625, 0.217315673828125, 0.25921630859375, 0.301116943359375, 0.343017578125, 0.384918212890625, 0.42681884765625, 0.468719482421875, 0.5106201171875, 0.552520751953125, 0.59442138671875, 0.636322021484375, 0.67822265625, 0.720123291015625, 0.76202392578125, 0.803924560546875, 0.8458251953125, 0.887725830078125, 0.92962646484375, 0.971527099609375, 1.013427734375, 1.055328369140625, 1.09722900390625, 1.139129638671875, 1.1810302734375, 1.222930908203125, 1.26483154296875, 1.306732177734375, 1.3486328125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 5.0, 3.0, 3.0, 10.0, 6.0, 9.0, 13.0, 17.0, 21.0, 21.0, 19.0, 20.0, 33.0, 46.0, 40.0, 56.0, 58.0, 69.0, 61.0, 58.0, 52.0, 47.0, 47.0, 48.0, 41.0, 28.0, 33.0, 24.0, 21.0, 18.0, 19.0, 7.0, 15.0, 8.0, 5.0, 2.0, 7.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002628326416015625, -0.0025337636470794678, -0.0024392008781433105, -0.0023446381092071533, -0.002250075340270996, -0.002155512571334839, -0.0020609498023986816, -0.0019663870334625244, -0.0018718242645263672, -0.00177726149559021, -0.0016826987266540527, -0.0015881359577178955, -0.0014935731887817383, -0.001399010419845581, -0.0013044476509094238, -0.0012098848819732666, -0.0011153221130371094, -0.0010207593441009521, -0.0009261965751647949, -0.0008316338062286377, -0.0007370710372924805, -0.0006425082683563232, -0.000547945499420166, -0.0004533827304840088, -0.00035881996154785156, -0.00026425719261169434, -0.0001696944236755371, -7.513165473937988e-05, 1.9431114196777344e-05, 0.00011399388313293457, 0.0002085566520690918, 0.000303119421005249, 0.00039768218994140625, 0.0004922449588775635, 0.0005868077278137207, 0.0006813704967498779, 0.0007759332656860352, 0.0008704960346221924, 0.0009650588035583496, 0.0010596215724945068, 0.001154184341430664, 0.0012487471103668213, 0.0013433098793029785, 0.0014378726482391357, 0.001532435417175293, 0.0016269981861114502, 0.0017215609550476074, 0.0018161237239837646, 0.0019106864929199219, 0.002005249261856079, 0.0020998120307922363, 0.0021943747997283936, 0.0022889375686645508, 0.002383500337600708, 0.0024780631065368652, 0.0025726258754730225, 0.0026671886444091797, 0.002761751413345337, 0.002856314182281494, 0.0029508769512176514, 0.0030454397201538086, 0.003140002489089966, 0.003234565258026123, 0.0033291280269622803, 0.0034236907958984375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 7.0, 5.0, 11.0, 12.0, 8.0, 8.0, 28.0, 27.0, 30.0, 31.0, 46.0, 78.0, 98.0, 139.0, 183.0, 407.0, 1732.0, 205806.0, 834517.0, 4057.0, 550.0, 238.0, 146.0, 93.0, 73.0, 45.0, 28.0, 23.0, 32.0, 21.0, 18.0, 14.0, 9.0, 8.0, 6.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06561279296875, -0.0636906623840332, -0.061768531799316406, -0.05984640121459961, -0.05792427062988281, -0.056002140045166016, -0.05408000946044922, -0.05215787887573242, -0.050235748291015625, -0.04831361770629883, -0.04639148712158203, -0.044469356536865234, -0.04254722595214844, -0.04062509536743164, -0.038702964782714844, -0.03678083419799805, -0.03485870361328125, -0.03293657302856445, -0.031014442443847656, -0.02909231185913086, -0.027170181274414062, -0.025248050689697266, -0.02332592010498047, -0.021403789520263672, -0.019481658935546875, -0.017559528350830078, -0.01563739776611328, -0.013715267181396484, -0.011793136596679688, -0.00987100601196289, -0.007948875427246094, -0.006026744842529297, -0.0041046142578125, -0.002182483673095703, -0.00026035308837890625, 0.0016617774963378906, 0.0035839080810546875, 0.005506038665771484, 0.007428169250488281, 0.009350299835205078, 0.011272430419921875, 0.013194561004638672, 0.015116691589355469, 0.017038822174072266, 0.018960952758789062, 0.02088308334350586, 0.022805213928222656, 0.024727344512939453, 0.02664947509765625, 0.028571605682373047, 0.030493736267089844, 0.03241586685180664, 0.03433799743652344, 0.036260128021240234, 0.03818225860595703, 0.04010438919067383, 0.042026519775390625, 0.04394865036010742, 0.04587078094482422, 0.047792911529541016, 0.04971504211425781, 0.05163717269897461, 0.053559303283691406, 0.0554814338684082, 0.057403564453125]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 5.0, 20.0, 51.0, 143.0, 257.0, 257.0, 137.0, 78.0, 28.0, 18.0, 11.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.007392326835542917, -0.007250649854540825, -0.007108972407877445, -0.006967295426875353, -0.006825617980211973, -0.006683940999209881, -0.006542263552546501, -0.006400586571544409, -0.006258909124881029, -0.006117232143878937, -0.005975554697215557, -0.005833877716213465, -0.005692200269550085, -0.005550523288547993, -0.005408845841884613, -0.005267168860882521, -0.005125491879880428, -0.004983814898878336, -0.004842137452214956, -0.004700460471212864, -0.004558783024549484, -0.004417106043547392, -0.004275428596884012, -0.00413375161588192, -0.00399207416921854, -0.003850396955385804, -0.003708719741553068, -0.003567042527720332, -0.003425365313887596, -0.00328368810005486, -0.003142010886222124, -0.0030003339052200317, -0.002858656458556652, -0.002716979244723916, -0.00257530203089118, -0.002433624817058444, -0.002291947603225708, -0.002150270389392972, -0.002008593175560236, -0.0018669160781428218, -0.001725238747894764, -0.001583561534062028, -0.001441884320229292, -0.001300207106396556, -0.0011585298925638199, -0.0010168526787310839, -0.0008751755813136697, -0.0007334983674809337, -0.0005918211536481977, -0.00045014393981546164, -0.0003084667550865561, -0.00016678957035765052, -2.5112356524914503e-05, 0.00011656485730782151, 0.0002582420129328966, 0.00039991922676563263, 0.0005415964405983686, 0.0006832736544311047, 0.0008249508682638407, 0.0009666280238889158, 0.0011083052959293127, 0.0012499825097620487, 0.001391659607179463, 0.001533336821012199, 0.001675014034844935]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 5.0, 9.0, 3.0, 5.0, 7.0, 7.0, 16.0, 14.0, 15.0, 16.0, 18.0, 20.0, 20.0, 24.0, 30.0, 32.0, 26.0, 41.0, 40.0, 29.0, 24.0, 33.0, 42.0, 44.0, 45.0, 39.0, 32.0, 25.0, 41.0, 33.0, 26.0, 30.0, 28.0, 26.0, 24.0, 25.0, 16.0, 19.0, 10.0, 14.0, 14.0, 7.0, 3.0, 8.0, 5.0, 5.0, 4.0, 4.0, 1.0, 5.0, 2.0, 2.0], "bins": [-0.001608431339263916, -0.0015622302889823914, -0.0015160292387008667, -0.001469828188419342, -0.0014236271381378174, -0.0013774260878562927, -0.001331225037574768, -0.0012850239872932434, -0.0012388229370117188, -0.001192621886730194, -0.0011464208364486694, -0.0011002197861671448, -0.0010540187358856201, -0.0010078176856040955, -0.0009616166353225708, -0.0009154155850410461, -0.0008692145347595215, -0.0008230134844779968, -0.0007768124341964722, -0.0007306113839149475, -0.0006844103336334229, -0.0006382092833518982, -0.0005920082330703735, -0.0005458071827888489, -0.0004996061325073242, -0.00045340508222579956, -0.0004072040319442749, -0.00036100298166275024, -0.0003148019313812256, -0.00026860088109970093, -0.00022239983081817627, -0.0001761987805366516, -0.00012999773025512695, -8.37966799736023e-05, -3.759562969207764e-05, 8.605420589447021e-06, 5.480647087097168e-05, 0.00010100752115249634, 0.000147208571434021, 0.00019340962171554565, 0.0002396106719970703, 0.00028581172227859497, 0.00033201277256011963, 0.0003782138228416443, 0.00042441487312316895, 0.0004706159234046936, 0.0005168169736862183, 0.0005630180239677429, 0.0006092190742492676, 0.0006554201245307922, 0.0007016211748123169, 0.0007478222250938416, 0.0007940232753753662, 0.0008402243256568909, 0.0008864253759384155, 0.0009326264262199402, 0.0009788274765014648, 0.0010250285267829895, 0.0010712295770645142, 0.0011174306273460388, 0.0011636316776275635, 0.0012098327279090881, 0.0012560337781906128, 0.0013022348284721375, 0.0013484358787536621]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 8.0, 6.0, 9.0, 12.0, 10.0, 14.0, 19.0, 19.0, 29.0, 25.0, 22.0, 31.0, 35.0, 33.0, 40.0, 48.0, 29.0, 45.0, 51.0, 40.0, 42.0, 48.0, 31.0, 41.0, 57.0, 36.0, 25.0, 29.0, 12.0, 22.0, 16.0, 19.0, 20.0, 18.0, 15.0, 7.0, 11.0, 6.0, 8.0, 4.0, 1.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.1484375, -13.7249755859375, -13.301513671875, -12.8780517578125, -12.45458984375, -12.0311279296875, -11.607666015625, -11.1842041015625, -10.7607421875, -10.3372802734375, -9.913818359375, -9.4903564453125, -9.06689453125, -8.6434326171875, -8.219970703125, -7.7965087890625, -7.373046875, -6.9495849609375, -6.526123046875, -6.1026611328125, -5.67919921875, -5.2557373046875, -4.832275390625, -4.4088134765625, -3.9853515625, -3.5618896484375, -3.138427734375, -2.7149658203125, -2.29150390625, -1.8680419921875, -1.444580078125, -1.0211181640625, -0.59765625, -0.1741943359375, 0.249267578125, 0.6727294921875, 1.09619140625, 1.5196533203125, 1.943115234375, 2.3665771484375, 2.7900390625, 3.2135009765625, 3.636962890625, 4.0604248046875, 4.48388671875, 4.9073486328125, 5.330810546875, 5.7542724609375, 6.177734375, 6.6011962890625, 7.024658203125, 7.4481201171875, 7.87158203125, 8.2950439453125, 8.718505859375, 9.1419677734375, 9.5654296875, 9.9888916015625, 10.412353515625, 10.8358154296875, 11.25927734375, 11.6827392578125, 12.106201171875, 12.5296630859375, 12.953125]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 6.0, 6.0, 9.0, 7.0, 16.0, 18.0, 30.0, 51.0, 64.0, 90.0, 152.0, 190.0, 292.0, 488.0, 759.0, 1168.0, 1956.0, 3108.0, 5572.0, 10420.0, 23532.0, 64583.0, 212816.0, 459382.0, 169414.0, 52705.0, 19906.0, 9036.0, 5003.0, 2887.0, 1715.0, 1100.0, 698.0, 458.0, 295.0, 197.0, 139.0, 78.0, 57.0, 47.0, 35.0, 26.0, 16.0, 12.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.49609375, -7.24957275390625, -7.0030517578125, -6.75653076171875, -6.510009765625, -6.26348876953125, -6.0169677734375, -5.77044677734375, -5.52392578125, -5.27740478515625, -5.0308837890625, -4.78436279296875, -4.537841796875, -4.29132080078125, -4.0447998046875, -3.79827880859375, -3.5517578125, -3.30523681640625, -3.0587158203125, -2.81219482421875, -2.565673828125, -2.31915283203125, -2.0726318359375, -1.82611083984375, -1.57958984375, -1.33306884765625, -1.0865478515625, -0.84002685546875, -0.593505859375, -0.34698486328125, -0.1004638671875, 0.14605712890625, 0.392578125, 0.63909912109375, 0.8856201171875, 1.13214111328125, 1.378662109375, 1.62518310546875, 1.8717041015625, 2.11822509765625, 2.36474609375, 2.61126708984375, 2.8577880859375, 3.10430908203125, 3.350830078125, 3.59735107421875, 3.8438720703125, 4.09039306640625, 4.3369140625, 4.58343505859375, 4.8299560546875, 5.07647705078125, 5.322998046875, 5.56951904296875, 5.8160400390625, 6.06256103515625, 6.30908203125, 6.55560302734375, 6.8021240234375, 7.04864501953125, 7.295166015625, 7.54168701171875, 7.7882080078125, 8.03472900390625, 8.28125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 1.0, 4.0, 7.0, 2.0, 8.0, 9.0, 9.0, 7.0, 9.0, 16.0, 16.0, 21.0, 20.0, 34.0, 27.0, 34.0, 31.0, 43.0, 40.0, 40.0, 56.0, 104.0, 1707.0, 282.0, 83.0, 52.0, 44.0, 44.0, 31.0, 27.0, 34.0, 39.0, 23.0, 30.0, 19.0, 17.0, 16.0, 9.0, 15.0, 10.0, 6.0, 11.0, 3.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-41.34375, -40.00146484375, -38.6591796875, -37.31689453125, -35.974609375, -34.63232421875, -33.2900390625, -31.94775390625, -30.60546875, -29.26318359375, -27.9208984375, -26.57861328125, -25.236328125, -23.89404296875, -22.5517578125, -21.20947265625, -19.8671875, -18.52490234375, -17.1826171875, -15.84033203125, -14.498046875, -13.15576171875, -11.8134765625, -10.47119140625, -9.12890625, -7.78662109375, -6.4443359375, -5.10205078125, -3.759765625, -2.41748046875, -1.0751953125, 0.26708984375, 1.609375, 2.95166015625, 4.2939453125, 5.63623046875, 6.978515625, 8.32080078125, 9.6630859375, 11.00537109375, 12.34765625, 13.68994140625, 15.0322265625, 16.37451171875, 17.716796875, 19.05908203125, 20.4013671875, 21.74365234375, 23.0859375, 24.42822265625, 25.7705078125, 27.11279296875, 28.455078125, 29.79736328125, 31.1396484375, 32.48193359375, 33.82421875, 35.16650390625, 36.5087890625, 37.85107421875, 39.193359375, 40.53564453125, 41.8779296875, 43.22021484375, 44.5625]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 9.0, 8.0, 12.0, 6.0, 22.0, 22.0, 23.0, 34.0, 53.0, 75.0, 100.0, 131.0, 204.0, 375.0, 915.0, 6259.0, 3114244.0, 20756.0, 1330.0, 407.0, 211.0, 136.0, 111.0, 71.0, 53.0, 41.0, 19.0, 17.0, 17.0, 16.0, 8.0, 9.0, 7.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-133.375, -129.41015625, -125.4453125, -121.48046875, -117.515625, -113.55078125, -109.5859375, -105.62109375, -101.65625, -97.69140625, -93.7265625, -89.76171875, -85.796875, -81.83203125, -77.8671875, -73.90234375, -69.9375, -65.97265625, -62.0078125, -58.04296875, -54.078125, -50.11328125, -46.1484375, -42.18359375, -38.21875, -34.25390625, -30.2890625, -26.32421875, -22.359375, -18.39453125, -14.4296875, -10.46484375, -6.5, -2.53515625, 1.4296875, 5.39453125, 9.359375, 13.32421875, 17.2890625, 21.25390625, 25.21875, 29.18359375, 33.1484375, 37.11328125, 41.078125, 45.04296875, 49.0078125, 52.97265625, 56.9375, 60.90234375, 64.8671875, 68.83203125, 72.796875, 76.76171875, 80.7265625, 84.69140625, 88.65625, 92.62109375, 96.5859375, 100.55078125, 104.515625, 108.48046875, 112.4453125, 116.41015625, 120.375]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 30.0, 292.0, 598.0, 86.0, 9.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.131656646728516, -27.649250030517578, -21.166845321655273, -14.684440612792969, -8.202033996582031, -1.7196273803710938, 4.762775421142578, 11.245182037353516, 17.727588653564453, 24.20999526977539, 30.692399978637695, 37.1748046875, 43.65721130371094, 50.139617919921875, 56.62202072143555, 63.104427337646484, 69.58683776855469, 76.06924438476562, 82.55165100097656, 89.0340576171875, 95.51646423339844, 101.99887084960938, 108.48126983642578, 114.96367645263672, 121.44607543945312, 127.92848205566406, 134.410888671875, 140.89329528808594, 147.37570190429688, 153.8581085205078, 160.34051513671875, 166.82290649414062, 173.30532836914062, 179.78773498535156, 186.2701416015625, 192.75254821777344, 199.23495483398438, 205.7173614501953, 212.19976806640625, 218.68215942382812, 225.16458129882812, 231.64698791503906, 238.12939453125, 244.61180114746094, 251.09420776367188, 257.57659912109375, 264.05902099609375, 270.5414123535156, 277.0238037109375, 283.5061950683594, 289.9886169433594, 296.47100830078125, 302.95343017578125, 309.4358215332031, 315.9182434082031, 322.400634765625, 328.883056640625, 335.3654479980469, 341.8478698730469, 348.33026123046875, 354.81268310546875, 361.2950744628906, 367.7774963378906, 374.2598876953125, 380.7423095703125]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 6.0, 2.0, 7.0, 10.0, 9.0, 12.0, 11.0, 18.0, 19.0, 22.0, 26.0, 29.0, 33.0, 31.0, 33.0, 35.0, 28.0, 40.0, 32.0, 28.0, 50.0, 43.0, 44.0, 46.0, 37.0, 44.0, 30.0, 32.0, 33.0, 31.0, 28.0, 31.0, 17.0, 19.0, 15.0, 8.0, 11.0, 6.0, 9.0, 10.0, 5.0, 8.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0], "bins": [-139.11285400390625, -135.02622985839844, -130.93959045410156, -126.85296630859375, -122.7663345336914, -118.67970275878906, -114.59307098388672, -110.50643920898438, -106.41981506347656, -102.33318328857422, -98.24655151367188, -94.15992736816406, -90.07329559326172, -85.98666381835938, -81.90003204345703, -77.81340026855469, -73.72676849365234, -69.64013671875, -65.55350494384766, -61.46687698364258, -57.3802490234375, -53.293617248535156, -49.20698547363281, -45.12035369873047, -41.03372573852539, -36.94709396362305, -32.86046600341797, -28.773834228515625, -24.687204360961914, -20.600574493408203, -16.51394271850586, -12.427312850952148, -8.340682983398438, -4.254052639007568, -0.16742229461669922, 3.919208526611328, 8.005838394165039, 12.09246826171875, 16.179100036621094, 20.265729904174805, 24.352359771728516, 28.438989639282227, 32.52561950683594, 36.61225128173828, 40.698883056640625, 44.7855110168457, 48.87214279174805, 52.958770751953125, 57.04540252685547, 61.13203430175781, 65.21866607666016, 69.3052978515625, 73.39192199707031, 77.47855377197266, 81.565185546875, 85.65181732177734, 89.73844909667969, 93.82508087158203, 97.91171264648438, 101.99833679199219, 106.08496856689453, 110.17160034179688, 114.25823211669922, 118.34486389160156, 122.43148803710938]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 9.0, 7.0, 9.0, 12.0, 17.0, 18.0, 19.0, 24.0, 25.0, 25.0, 31.0, 31.0, 42.0, 38.0, 42.0, 46.0, 44.0, 34.0, 54.0, 42.0, 41.0, 40.0, 42.0, 40.0, 39.0, 34.0, 26.0, 20.0, 17.0, 22.0, 22.0, 11.0, 14.0, 22.0, 5.0, 7.0, 6.0, 6.0, 7.0, 2.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-15.4375, -14.9892578125, -14.541015625, -14.0927734375, -13.64453125, -13.1962890625, -12.748046875, -12.2998046875, -11.8515625, -11.4033203125, -10.955078125, -10.5068359375, -10.05859375, -9.6103515625, -9.162109375, -8.7138671875, -8.265625, -7.8173828125, -7.369140625, -6.9208984375, -6.47265625, -6.0244140625, -5.576171875, -5.1279296875, -4.6796875, -4.2314453125, -3.783203125, -3.3349609375, -2.88671875, -2.4384765625, -1.990234375, -1.5419921875, -1.09375, -0.6455078125, -0.197265625, 0.2509765625, 0.69921875, 1.1474609375, 1.595703125, 2.0439453125, 2.4921875, 2.9404296875, 3.388671875, 3.8369140625, 4.28515625, 4.7333984375, 5.181640625, 5.6298828125, 6.078125, 6.5263671875, 6.974609375, 7.4228515625, 7.87109375, 8.3193359375, 8.767578125, 9.2158203125, 9.6640625, 10.1123046875, 10.560546875, 11.0087890625, 11.45703125, 11.9052734375, 12.353515625, 12.8017578125, 13.25]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 1.0, 2.0, 14.0, 6.0, 12.0, 9.0, 19.0, 23.0, 29.0, 38.0, 43.0, 64.0, 112.0, 175.0, 354.0, 694.0, 1565.0, 4465.0, 21801.0, 2071102.0, 2061419.0, 24321.0, 4691.0, 1664.0, 734.0, 347.0, 194.0, 121.0, 75.0, 38.0, 29.0, 22.0, 14.0, 19.0, 14.0, 15.0, 8.0, 6.0, 5.0, 4.0, 4.0, 5.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-63.0, -61.14697265625, -59.2939453125, -57.44091796875, -55.587890625, -53.73486328125, -51.8818359375, -50.02880859375, -48.17578125, -46.32275390625, -44.4697265625, -42.61669921875, -40.763671875, -38.91064453125, -37.0576171875, -35.20458984375, -33.3515625, -31.49853515625, -29.6455078125, -27.79248046875, -25.939453125, -24.08642578125, -22.2333984375, -20.38037109375, -18.52734375, -16.67431640625, -14.8212890625, -12.96826171875, -11.115234375, -9.26220703125, -7.4091796875, -5.55615234375, -3.703125, -1.85009765625, 0.0029296875, 1.85595703125, 3.708984375, 5.56201171875, 7.4150390625, 9.26806640625, 11.12109375, 12.97412109375, 14.8271484375, 16.68017578125, 18.533203125, 20.38623046875, 22.2392578125, 24.09228515625, 25.9453125, 27.79833984375, 29.6513671875, 31.50439453125, 33.357421875, 35.21044921875, 37.0634765625, 38.91650390625, 40.76953125, 42.62255859375, 44.4755859375, 46.32861328125, 48.181640625, 50.03466796875, 51.8876953125, 53.74072265625, 55.59375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 3.0, 6.0, 13.0, 12.0, 7.0, 9.0, 15.0, 19.0, 21.0, 29.0, 44.0, 74.0, 95.0, 157.0, 309.0, 514.0, 716.0, 745.0, 502.0, 307.0, 169.0, 97.0, 56.0, 41.0, 28.0, 22.0, 7.0, 11.0, 12.0, 5.0, 7.0, 5.0, 7.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.40625, -24.46484375, -23.5234375, -22.58203125, -21.640625, -20.69921875, -19.7578125, -18.81640625, -17.875, -16.93359375, -15.9921875, -15.05078125, -14.109375, -13.16796875, -12.2265625, -11.28515625, -10.34375, -9.40234375, -8.4609375, -7.51953125, -6.578125, -5.63671875, -4.6953125, -3.75390625, -2.8125, -1.87109375, -0.9296875, 0.01171875, 0.953125, 1.89453125, 2.8359375, 3.77734375, 4.71875, 5.66015625, 6.6015625, 7.54296875, 8.484375, 9.42578125, 10.3671875, 11.30859375, 12.25, 13.19140625, 14.1328125, 15.07421875, 16.015625, 16.95703125, 17.8984375, 18.83984375, 19.78125, 20.72265625, 21.6640625, 22.60546875, 23.546875, 24.48828125, 25.4296875, 26.37109375, 27.3125, 28.25390625, 29.1953125, 30.13671875, 31.078125, 32.01953125, 32.9609375, 33.90234375, 34.84375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 14.0, 9.0, 15.0, 16.0, 31.0, 45.0, 69.0, 128.0, 236.0, 632.0, 1859.0, 7446.0, 49378.0, 3875744.0, 238735.0, 14913.0, 3129.0, 1002.0, 379.0, 182.0, 104.0, 48.0, 42.0, 24.0, 22.0, 11.0, 10.0, 11.0, 12.0, 7.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0], "bins": [-106.5625, -103.66015625, -100.7578125, -97.85546875, -94.953125, -92.05078125, -89.1484375, -86.24609375, -83.34375, -80.44140625, -77.5390625, -74.63671875, -71.734375, -68.83203125, -65.9296875, -63.02734375, -60.125, -57.22265625, -54.3203125, -51.41796875, -48.515625, -45.61328125, -42.7109375, -39.80859375, -36.90625, -34.00390625, -31.1015625, -28.19921875, -25.296875, -22.39453125, -19.4921875, -16.58984375, -13.6875, -10.78515625, -7.8828125, -4.98046875, -2.078125, 0.82421875, 3.7265625, 6.62890625, 9.53125, 12.43359375, 15.3359375, 18.23828125, 21.140625, 24.04296875, 26.9453125, 29.84765625, 32.75, 35.65234375, 38.5546875, 41.45703125, 44.359375, 47.26171875, 50.1640625, 53.06640625, 55.96875, 58.87109375, 61.7734375, 64.67578125, 67.578125, 70.48046875, 73.3828125, 76.28515625, 79.1875]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [6.0, 14.0, 23.0, 65.0, 258.0, 411.0, 186.0, 38.0, 10.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.839599609375, -54.55547332763672, -42.27134323120117, -29.987213134765625, -17.703086853027344, -5.4189605712890625, 6.86517333984375, 19.14929962158203, 31.433425903320312, 43.717552185058594, 56.00168228149414, 68.28581237792969, 80.56993865966797, 92.85406494140625, 105.13819885253906, 117.42232513427734, 129.70645141601562, 141.99058532714844, 154.2747039794922, 166.558837890625, 178.84295654296875, 191.12709045410156, 203.41122436523438, 215.69534301757812, 227.97947692871094, 240.26361083984375, 252.5477294921875, 264.83184814453125, 277.1159973144531, 289.4001159667969, 301.68426513671875, 313.9683837890625, 326.25250244140625, 338.53662109375, 350.8207702636719, 363.1048889160156, 375.3890075683594, 387.67315673828125, 399.957275390625, 412.24139404296875, 424.5255126953125, 436.80963134765625, 449.0937805175781, 461.3778991699219, 473.6620178222656, 485.9461669921875, 498.23028564453125, 510.514404296875, 522.798583984375, 535.0827026367188, 547.3668212890625, 559.6510009765625, 571.9351196289062, 584.21923828125, 596.5033569335938, 608.7874755859375, 621.0715942382812, 633.355712890625, 645.6398315429688, 657.9239501953125, 670.2081298828125, 682.4922485351562, 694.7763671875, 707.0604858398438, 719.3446044921875]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 5.0, 5.0, 3.0, 6.0, 7.0, 14.0, 17.0, 14.0, 7.0, 22.0, 25.0, 28.0, 27.0, 32.0, 28.0, 33.0, 38.0, 33.0, 39.0, 39.0, 42.0, 43.0, 41.0, 30.0, 42.0, 35.0, 31.0, 45.0, 37.0, 32.0, 24.0, 26.0, 36.0, 19.0, 18.0, 21.0, 11.0, 12.0, 6.0, 15.0, 3.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-80.1352767944336, -77.53160095214844, -74.92791748046875, -72.3242416381836, -69.72056579589844, -67.11688232421875, -64.5132064819336, -61.90953063964844, -59.305850982666016, -56.702171325683594, -54.09849548339844, -51.494815826416016, -48.891136169433594, -46.28746032714844, -43.683780670166016, -41.080101013183594, -38.47642517089844, -35.872745513916016, -33.26906967163086, -30.665390014648438, -28.06171226501465, -25.45803451538086, -22.854354858398438, -20.25067710876465, -17.64699935913086, -15.04332160949707, -12.439642906188965, -9.83596420288086, -7.23228645324707, -4.628608703613281, -2.024930000305176, 0.5787487030029297, 3.1824188232421875, 5.786097049713135, 8.389775276184082, 10.993453979492188, 13.597131729125977, 16.200809478759766, 18.804489135742188, 21.408166885375977, 24.011844635009766, 26.615522384643555, 29.219200134277344, 31.822879791259766, 34.42655944824219, 37.030235290527344, 39.633914947509766, 42.23759460449219, 44.841270446777344, 47.444950103759766, 50.04862594604492, 52.652305603027344, 55.2559814453125, 57.85966110229492, 60.463340759277344, 63.0670166015625, 65.67070007324219, 68.27437591552734, 70.87805938720703, 73.48173522949219, 76.08541107177734, 78.6890869140625, 81.29277038574219, 83.89644622802734, 86.5001220703125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 5.0, 5.0, 4.0, 13.0, 16.0, 7.0, 8.0, 23.0, 21.0, 29.0, 32.0, 21.0, 35.0, 38.0, 31.0, 40.0, 42.0, 41.0, 37.0, 44.0, 49.0, 43.0, 40.0, 45.0, 37.0, 38.0, 32.0, 26.0, 25.0, 23.0, 22.0, 26.0, 12.0, 17.0, 12.0, 13.0, 7.0, 7.0, 8.0, 6.0, 5.0, 7.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7421875, -13.30029296875, -12.8583984375, -12.41650390625, -11.974609375, -11.53271484375, -11.0908203125, -10.64892578125, -10.20703125, -9.76513671875, -9.3232421875, -8.88134765625, -8.439453125, -7.99755859375, -7.5556640625, -7.11376953125, -6.671875, -6.22998046875, -5.7880859375, -5.34619140625, -4.904296875, -4.46240234375, -4.0205078125, -3.57861328125, -3.13671875, -2.69482421875, -2.2529296875, -1.81103515625, -1.369140625, -0.92724609375, -0.4853515625, -0.04345703125, 0.3984375, 0.84033203125, 1.2822265625, 1.72412109375, 2.166015625, 2.60791015625, 3.0498046875, 3.49169921875, 3.93359375, 4.37548828125, 4.8173828125, 5.25927734375, 5.701171875, 6.14306640625, 6.5849609375, 7.02685546875, 7.46875, 7.91064453125, 8.3525390625, 8.79443359375, 9.236328125, 9.67822265625, 10.1201171875, 10.56201171875, 11.00390625, 11.44580078125, 11.8876953125, 12.32958984375, 12.771484375, 13.21337890625, 13.6552734375, 14.09716796875, 14.5390625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 7.0, 12.0, 19.0, 29.0, 29.0, 58.0, 89.0, 116.0, 169.0, 288.0, 365.0, 620.0, 1034.0, 1564.0, 2381.0, 3871.0, 5988.0, 9861.0, 16530.0, 27846.0, 46916.0, 82861.0, 156712.0, 266085.0, 190054.0, 98667.0, 54888.0, 32001.0, 19134.0, 11380.0, 6953.0, 4359.0, 2798.0, 1670.0, 1130.0, 723.0, 432.0, 284.0, 208.0, 146.0, 90.0, 58.0, 39.0, 22.0, 26.0, 21.0, 10.0, 4.0, 4.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-1.37109375, -1.3303375244140625, -1.289581298828125, -1.2488250732421875, -1.20806884765625, -1.1673126220703125, -1.126556396484375, -1.0858001708984375, -1.0450439453125, -1.0042877197265625, -0.963531494140625, -0.9227752685546875, -0.88201904296875, -0.8412628173828125, -0.800506591796875, -0.7597503662109375, -0.718994140625, -0.6782379150390625, -0.637481689453125, -0.5967254638671875, -0.55596923828125, -0.5152130126953125, -0.474456787109375, -0.4337005615234375, -0.3929443359375, -0.3521881103515625, -0.311431884765625, -0.2706756591796875, -0.22991943359375, -0.1891632080078125, -0.148406982421875, -0.1076507568359375, -0.06689453125, -0.0261383056640625, 0.014617919921875, 0.0553741455078125, 0.09613037109375, 0.1368865966796875, 0.177642822265625, 0.2183990478515625, 0.2591552734375, 0.2999114990234375, 0.340667724609375, 0.3814239501953125, 0.42218017578125, 0.4629364013671875, 0.503692626953125, 0.5444488525390625, 0.585205078125, 0.6259613037109375, 0.666717529296875, 0.7074737548828125, 0.74822998046875, 0.7889862060546875, 0.829742431640625, 0.8704986572265625, 0.9112548828125, 0.9520111083984375, 0.992767333984375, 1.0335235595703125, 1.07427978515625, 1.1150360107421875, 1.155792236328125, 1.1965484619140625, 1.2373046875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 7.0, 11.0, 13.0, 13.0, 14.0, 10.0, 21.0, 22.0, 19.0, 14.0, 36.0, 29.0, 40.0, 39.0, 49.0, 43.0, 42.0, 35.0, 47.0, 1068.0, 33.0, 42.0, 34.0, 38.0, 50.0, 31.0, 40.0, 27.0, 23.0, 25.0, 25.0, 17.0, 9.0, 16.0, 11.0, 6.0, 8.0, 8.0, 6.0, 4.0, 8.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-10.046875, -9.7447509765625, -9.442626953125, -9.1405029296875, -8.83837890625, -8.5362548828125, -8.234130859375, -7.9320068359375, -7.6298828125, -7.3277587890625, -7.025634765625, -6.7235107421875, -6.42138671875, -6.1192626953125, -5.817138671875, -5.5150146484375, -5.212890625, -4.9107666015625, -4.608642578125, -4.3065185546875, -4.00439453125, -3.7022705078125, -3.400146484375, -3.0980224609375, -2.7958984375, -2.4937744140625, -2.191650390625, -1.8895263671875, -1.58740234375, -1.2852783203125, -0.983154296875, -0.6810302734375, -0.37890625, -0.0767822265625, 0.225341796875, 0.5274658203125, 0.82958984375, 1.1317138671875, 1.433837890625, 1.7359619140625, 2.0380859375, 2.3402099609375, 2.642333984375, 2.9444580078125, 3.24658203125, 3.5487060546875, 3.850830078125, 4.1529541015625, 4.455078125, 4.7572021484375, 5.059326171875, 5.3614501953125, 5.66357421875, 5.9656982421875, 6.267822265625, 6.5699462890625, 6.8720703125, 7.1741943359375, 7.476318359375, 7.7784423828125, 8.08056640625, 8.3826904296875, 8.684814453125, 8.9869384765625, 9.2890625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 2.0, 3.0, 5.0, 10.0, 7.0, 7.0, 14.0, 26.0, 42.0, 45.0, 68.0, 118.0, 164.0, 268.0, 377.0, 629.0, 1022.0, 1728.0, 2806.0, 4672.0, 8257.0, 14206.0, 25548.0, 47380.0, 90780.0, 195337.0, 1358395.0, 168813.0, 79937.0, 42343.0, 22985.0, 12773.0, 7272.0, 4375.0, 2522.0, 1584.0, 939.0, 575.0, 403.0, 231.0, 145.0, 108.0, 70.0, 50.0, 34.0, 25.0, 14.0, 10.0, 5.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5283203125, -1.482574462890625, -1.43682861328125, -1.391082763671875, -1.3453369140625, -1.299591064453125, -1.25384521484375, -1.208099365234375, -1.162353515625, -1.116607666015625, -1.07086181640625, -1.025115966796875, -0.9793701171875, -0.933624267578125, -0.88787841796875, -0.842132568359375, -0.79638671875, -0.750640869140625, -0.70489501953125, -0.659149169921875, -0.6134033203125, -0.567657470703125, -0.52191162109375, -0.476165771484375, -0.430419921875, -0.384674072265625, -0.33892822265625, -0.293182373046875, -0.2474365234375, -0.201690673828125, -0.15594482421875, -0.110198974609375, -0.064453125, -0.018707275390625, 0.02703857421875, 0.072784423828125, 0.1185302734375, 0.164276123046875, 0.21002197265625, 0.255767822265625, 0.301513671875, 0.347259521484375, 0.39300537109375, 0.438751220703125, 0.4844970703125, 0.530242919921875, 0.57598876953125, 0.621734619140625, 0.66748046875, 0.713226318359375, 0.75897216796875, 0.804718017578125, 0.8504638671875, 0.896209716796875, 0.94195556640625, 0.987701416015625, 1.033447265625, 1.079193115234375, 1.12493896484375, 1.170684814453125, 1.2164306640625, 1.262176513671875, 1.30792236328125, 1.353668212890625, 1.3994140625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 8.0, 8.0, 10.0, 2.0, 8.0, 14.0, 13.0, 14.0, 24.0, 23.0, 26.0, 33.0, 36.0, 34.0, 35.0, 43.0, 41.0, 53.0, 36.0, 60.0, 45.0, 55.0, 40.0, 36.0, 31.0, 31.0, 32.0, 27.0, 32.0, 19.0, 19.0, 18.0, 24.0, 9.0, 18.0, 8.0, 7.0, 12.0, 5.0, 4.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0026988983154296875, -0.0026126205921173096, -0.0025263428688049316, -0.0024400651454925537, -0.0023537874221801758, -0.002267509698867798, -0.00218123197555542, -0.002094954252243042, -0.002008676528930664, -0.0019223988056182861, -0.0018361210823059082, -0.0017498433589935303, -0.0016635656356811523, -0.0015772879123687744, -0.0014910101890563965, -0.0014047324657440186, -0.0013184547424316406, -0.0012321770191192627, -0.0011458992958068848, -0.0010596215724945068, -0.0009733438491821289, -0.000887066125869751, -0.000800788402557373, -0.0007145106792449951, -0.0006282329559326172, -0.0005419552326202393, -0.00045567750930786133, -0.0003693997859954834, -0.00028312206268310547, -0.00019684433937072754, -0.00011056661605834961, -2.428889274597168e-05, 6.198883056640625e-05, 0.00014826655387878418, 0.0002345442771911621, 0.00032082200050354004, 0.00040709972381591797, 0.0004933774471282959, 0.0005796551704406738, 0.0006659328937530518, 0.0007522106170654297, 0.0008384883403778076, 0.0009247660636901855, 0.0010110437870025635, 0.0010973215103149414, 0.0011835992336273193, 0.0012698769569396973, 0.0013561546802520752, 0.0014424324035644531, 0.001528710126876831, 0.001614987850189209, 0.001701265573501587, 0.0017875432968139648, 0.0018738210201263428, 0.0019600987434387207, 0.0020463764667510986, 0.0021326541900634766, 0.0022189319133758545, 0.0023052096366882324, 0.0023914873600006104, 0.0024777650833129883, 0.002564042806625366, 0.002650320529937744, 0.002736598253250122, 0.0028228759765625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 6.0, 5.0, 8.0, 4.0, 9.0, 13.0, 14.0, 14.0, 21.0, 29.0, 35.0, 40.0, 54.0, 49.0, 71.0, 85.0, 157.0, 274.0, 796.0, 14878.0, 957410.0, 72021.0, 1414.0, 397.0, 172.0, 139.0, 100.0, 66.0, 58.0, 44.0, 37.0, 31.0, 19.0, 17.0, 17.0, 17.0, 4.0, 8.0, 8.0, 9.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0606689453125, -0.058811187744140625, -0.05695343017578125, -0.055095672607421875, -0.0532379150390625, -0.051380157470703125, -0.04952239990234375, -0.047664642333984375, -0.045806884765625, -0.043949127197265625, -0.04209136962890625, -0.040233612060546875, -0.0383758544921875, -0.036518096923828125, -0.03466033935546875, -0.032802581787109375, -0.03094482421875, -0.029087066650390625, -0.02722930908203125, -0.025371551513671875, -0.0235137939453125, -0.021656036376953125, -0.01979827880859375, -0.017940521240234375, -0.016082763671875, -0.014225006103515625, -0.01236724853515625, -0.010509490966796875, -0.0086517333984375, -0.006793975830078125, -0.00493621826171875, -0.003078460693359375, -0.001220703125, 0.000637054443359375, 0.00249481201171875, 0.004352569580078125, 0.0062103271484375, 0.008068084716796875, 0.00992584228515625, 0.011783599853515625, 0.013641357421875, 0.015499114990234375, 0.01735687255859375, 0.019214630126953125, 0.0210723876953125, 0.022930145263671875, 0.02478790283203125, 0.026645660400390625, 0.02850341796875, 0.030361175537109375, 0.03221893310546875, 0.034076690673828125, 0.0359344482421875, 0.037792205810546875, 0.03964996337890625, 0.041507720947265625, 0.043365478515625, 0.045223236083984375, 0.04708099365234375, 0.048938751220703125, 0.0507965087890625, 0.052654266357421875, 0.05451202392578125, 0.056369781494140625, 0.0582275390625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 8.0, 11.0, 10.0, 23.0, 36.0, 53.0, 70.0, 120.0, 121.0, 161.0, 124.0, 78.0, 67.0, 46.0, 34.0, 10.0, 8.0, 7.0, 9.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001576072652824223, -0.0014942854177206755, -0.001412498182617128, -0.0013307109475135803, -0.001248923595994711, -0.0011671363608911633, -0.0010853491257876158, -0.0010035617742687464, -0.0009217745973728597, -0.0008399873622693121, -0.0007582000689581037, -0.0006764128338545561, -0.0005946255987510085, -0.0005128383054398, -0.00043105107033625245, -0.00034926377702504396, -0.0002674765419214964, -0.00018568927771411836, -0.00010390202805865556, -2.211477840319276e-05, 5.967248580418527e-05, 0.0001414597500115633, 0.00022324698511511087, 0.00030503427842631936, 0.00038682151352986693, 0.00046860877773724496, 0.000550396041944623, 0.0006321832770481706, 0.0007139705121517181, 0.0007957578054629266, 0.0008775450405664742, 0.0009593323338776827, 0.001041119685396552, 0.0011229069205000997, 0.0012046941556036472, 0.0012864815071225166, 0.0013682687422260642, 0.0014500559773296118, 0.0015318432124331594, 0.001613630447536707, 0.0016954177990555763, 0.001777205034159124, 0.0018589922692626715, 0.0019407796207815409, 0.0020225667394697666, 0.002104354090988636, 0.0021861414425075054, 0.002267928561195731, 0.002349715679883957, 0.0024315030314028263, 0.002513290150091052, 0.0025950775016099215, 0.002676864620298147, 0.0027586519718170166, 0.002840439323335886, 0.0029222264420241117, 0.003004013793542981, 0.0030858011450618505, 0.0031675882637500763, 0.0032493756152689457, 0.0033311627339571714, 0.003412950085476041, 0.0034947372041642666, 0.003576524555683136, 0.0036583119072020054]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 2.0, 6.0, 2.0, 8.0, 9.0, 14.0, 12.0, 16.0, 17.0, 15.0, 33.0, 36.0, 28.0, 43.0, 33.0, 39.0, 45.0, 32.0, 48.0, 37.0, 45.0, 34.0, 56.0, 38.0, 44.0, 27.0, 36.0, 28.0, 37.0, 24.0, 26.0, 23.0, 15.0, 17.0, 19.0, 11.0, 4.0, 12.0, 11.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.002001047134399414, -0.0019459407776594162, -0.0018908344209194183, -0.0018357280641794205, -0.0017806217074394226, -0.0017255153506994247, -0.0016704089939594269, -0.001615302637219429, -0.0015601962804794312, -0.0015050899237394333, -0.0014499835669994354, -0.0013948772102594376, -0.0013397708535194397, -0.0012846644967794418, -0.001229558140039444, -0.001174451783299446, -0.0011193454265594482, -0.0010642390698194504, -0.0010091327130794525, -0.0009540263563394547, -0.0008989199995994568, -0.0008438136428594589, -0.0007887072861194611, -0.0007336009293794632, -0.0006784945726394653, -0.0006233882158994675, -0.0005682818591594696, -0.0005131755024194717, -0.0004580691456794739, -0.000402962788939476, -0.00034785643219947815, -0.0002927500754594803, -0.00023764371871948242, -0.00018253736197948456, -0.0001274310052394867, -7.232464849948883e-05, -1.7218291759490967e-05, 3.78880649805069e-05, 9.299442172050476e-05, 0.00014810077846050262, 0.0002032071352005005, 0.00025831349194049835, 0.0003134198486804962, 0.0003685262054204941, 0.00042363256216049194, 0.0004787389189004898, 0.0005338452756404877, 0.0005889516323804855, 0.0006440579891204834, 0.0006991643458604813, 0.0007542707026004791, 0.000809377059340477, 0.0008644834160804749, 0.0009195897728204727, 0.0009746961295604706, 0.0010298024863004684, 0.0010849088430404663, 0.0011400151997804642, 0.001195121556520462, 0.00125022791326046, 0.0013053342700004578, 0.0013604406267404556, 0.0014155469834804535, 0.0014706533402204514, 0.0015257596969604492]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 6.0, 5.0, 5.0, 4.0, 13.0, 16.0, 7.0, 8.0, 23.0, 21.0, 29.0, 32.0, 21.0, 35.0, 38.0, 31.0, 40.0, 42.0, 41.0, 37.0, 44.0, 49.0, 43.0, 40.0, 45.0, 37.0, 38.0, 32.0, 26.0, 25.0, 23.0, 22.0, 26.0, 12.0, 17.0, 12.0, 13.0, 7.0, 7.0, 8.0, 6.0, 5.0, 7.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.7421875, -13.30029296875, -12.8583984375, -12.41650390625, -11.974609375, -11.53271484375, -11.0908203125, -10.64892578125, -10.20703125, -9.76513671875, -9.3232421875, -8.88134765625, -8.439453125, -7.99755859375, -7.5556640625, -7.11376953125, -6.671875, -6.22998046875, -5.7880859375, -5.34619140625, -4.904296875, -4.46240234375, -4.0205078125, -3.57861328125, -3.13671875, -2.69482421875, -2.2529296875, -1.81103515625, -1.369140625, -0.92724609375, -0.4853515625, -0.04345703125, 0.3984375, 0.84033203125, 1.2822265625, 1.72412109375, 2.166015625, 2.60791015625, 3.0498046875, 3.49169921875, 3.93359375, 4.37548828125, 4.8173828125, 5.25927734375, 5.701171875, 6.14306640625, 6.5849609375, 7.02685546875, 7.46875, 7.91064453125, 8.3525390625, 8.79443359375, 9.236328125, 9.67822265625, 10.1201171875, 10.56201171875, 11.00390625, 11.44580078125, 11.8876953125, 12.32958984375, 12.771484375, 13.21337890625, 13.6552734375, 14.09716796875, 14.5390625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 5.0, 4.0, 2.0, 13.0, 16.0, 18.0, 29.0, 18.0, 34.0, 66.0, 69.0, 87.0, 113.0, 131.0, 191.0, 250.0, 301.0, 464.0, 567.0, 768.0, 989.0, 1357.0, 2004.0, 3013.0, 4940.0, 9164.0, 20063.0, 63861.0, 335845.0, 467463.0, 85171.0, 24265.0, 10300.0, 5472.0, 3442.0, 2212.0, 1514.0, 1130.0, 787.0, 520.0, 428.0, 333.0, 237.0, 219.0, 149.0, 145.0, 95.0, 82.0, 55.0, 36.0, 34.0, 26.0, 24.0, 27.0, 9.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-10.1484375, -9.832275390625, -9.51611328125, -9.199951171875, -8.8837890625, -8.567626953125, -8.25146484375, -7.935302734375, -7.619140625, -7.302978515625, -6.98681640625, -6.670654296875, -6.3544921875, -6.038330078125, -5.72216796875, -5.406005859375, -5.08984375, -4.773681640625, -4.45751953125, -4.141357421875, -3.8251953125, -3.509033203125, -3.19287109375, -2.876708984375, -2.560546875, -2.244384765625, -1.92822265625, -1.612060546875, -1.2958984375, -0.979736328125, -0.66357421875, -0.347412109375, -0.03125, 0.284912109375, 0.60107421875, 0.917236328125, 1.2333984375, 1.549560546875, 1.86572265625, 2.181884765625, 2.498046875, 2.814208984375, 3.13037109375, 3.446533203125, 3.7626953125, 4.078857421875, 4.39501953125, 4.711181640625, 5.02734375, 5.343505859375, 5.65966796875, 5.975830078125, 6.2919921875, 6.608154296875, 6.92431640625, 7.240478515625, 7.556640625, 7.872802734375, 8.18896484375, 8.505126953125, 8.8212890625, 9.137451171875, 9.45361328125, 9.769775390625, 10.0859375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 1.0, 3.0, 7.0, 4.0, 10.0, 7.0, 4.0, 9.0, 18.0, 9.0, 19.0, 18.0, 21.0, 30.0, 45.0, 37.0, 37.0, 59.0, 61.0, 62.0, 74.0, 1599.0, 399.0, 73.0, 61.0, 60.0, 49.0, 36.0, 41.0, 23.0, 22.0, 34.0, 14.0, 17.0, 14.0, 12.0, 9.0, 16.0, 8.0, 6.0, 7.0, 5.0, 4.0, 2.0, 1.0, 2.0, 2.0, 5.0, 1.0], "bins": [-55.90625, -54.3935546875, -52.880859375, -51.3681640625, -49.85546875, -48.3427734375, -46.830078125, -45.3173828125, -43.8046875, -42.2919921875, -40.779296875, -39.2666015625, -37.75390625, -36.2412109375, -34.728515625, -33.2158203125, -31.703125, -30.1904296875, -28.677734375, -27.1650390625, -25.65234375, -24.1396484375, -22.626953125, -21.1142578125, -19.6015625, -18.0888671875, -16.576171875, -15.0634765625, -13.55078125, -12.0380859375, -10.525390625, -9.0126953125, -7.5, -5.9873046875, -4.474609375, -2.9619140625, -1.44921875, 0.0634765625, 1.576171875, 3.0888671875, 4.6015625, 6.1142578125, 7.626953125, 9.1396484375, 10.65234375, 12.1650390625, 13.677734375, 15.1904296875, 16.703125, 18.2158203125, 19.728515625, 21.2412109375, 22.75390625, 24.2666015625, 25.779296875, 27.2919921875, 28.8046875, 30.3173828125, 31.830078125, 33.3427734375, 34.85546875, 36.3681640625, 37.880859375, 39.3935546875, 40.90625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 6.0, 18.0, 14.0, 30.0, 65.0, 102.0, 192.0, 494.0, 5356.0, 3135124.0, 3448.0, 450.0, 191.0, 94.0, 56.0, 33.0, 14.0, 6.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-294.75, -285.06640625, -275.3828125, -265.69921875, -256.015625, -246.33203125, -236.6484375, -226.96484375, -217.28125, -207.59765625, -197.9140625, -188.23046875, -178.546875, -168.86328125, -159.1796875, -149.49609375, -139.8125, -130.12890625, -120.4453125, -110.76171875, -101.078125, -91.39453125, -81.7109375, -72.02734375, -62.34375, -52.66015625, -42.9765625, -33.29296875, -23.609375, -13.92578125, -4.2421875, 5.44140625, 15.125, 24.80859375, 34.4921875, 44.17578125, 53.859375, 63.54296875, 73.2265625, 82.91015625, 92.59375, 102.27734375, 111.9609375, 121.64453125, 131.328125, 141.01171875, 150.6953125, 160.37890625, 170.0625, 179.74609375, 189.4296875, 199.11328125, 208.796875, 218.48046875, 228.1640625, 237.84765625, 247.53125, 257.21484375, 266.8984375, 276.58203125, 286.265625, 295.94921875, 305.6328125, 315.31640625, 325.0]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 698.0, 313.0, 3.0, 2.0, 1.0], "bins": [-1483.9656982421875, -1459.193603515625, -1434.42138671875, -1409.6492919921875, -1384.8770751953125, -1360.10498046875, -1335.3328857421875, -1310.5606689453125, -1285.78857421875, -1261.0164794921875, -1236.2442626953125, -1211.47216796875, -1186.699951171875, -1161.9278564453125, -1137.15576171875, -1112.383544921875, -1087.6114501953125, -1062.83935546875, -1038.067138671875, -1013.2950439453125, -988.5228881835938, -963.750732421875, -938.9785766601562, -914.2064208984375, -889.4342651367188, -864.662109375, -839.8899536132812, -815.1178588867188, -790.345703125, -765.5735473632812, -740.8013916015625, -716.029296875, -691.257080078125, -666.4849243164062, -641.7127685546875, -616.940673828125, -592.1685180664062, -567.3963623046875, -542.6242065429688, -517.85205078125, -493.0799560546875, -468.30780029296875, -443.5356750488281, -418.7635192871094, -393.99139404296875, -369.21923828125, -344.44708251953125, -319.6749572753906, -294.90283203125, -270.13067626953125, -245.35855102539062, -220.58639526367188, -195.81427001953125, -171.0421142578125, -146.2699737548828, -121.49783325195312, -96.72569274902344, -71.95355224609375, -47.1814079284668, -22.409263610839844, 2.3628768920898438, 27.13501739501953, 51.90716552734375, 76.67930603027344, 101.45144653320312]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 3.0, 0.0, 5.0, 7.0, 11.0, 11.0, 15.0, 13.0, 14.0, 20.0, 20.0, 27.0, 27.0, 25.0, 25.0, 29.0, 30.0, 24.0, 40.0, 37.0, 40.0, 36.0, 43.0, 35.0, 40.0, 40.0, 36.0, 27.0, 40.0, 33.0, 28.0, 39.0, 29.0, 22.0, 24.0, 18.0, 9.0, 14.0, 11.0, 14.0, 9.0, 8.0, 6.0, 2.0, 5.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-116.2413330078125, -112.45997619628906, -108.67862701416016, -104.89727020263672, -101.11591339111328, -97.33456420898438, -93.55320739746094, -89.7718505859375, -85.99049377441406, -82.20913696289062, -78.42778778076172, -74.64643096923828, -70.86507415771484, -67.08372497558594, -63.3023681640625, -59.52101135253906, -55.739662170410156, -51.958309173583984, -48.17695236206055, -44.395599365234375, -40.61424255371094, -36.832889556884766, -33.051536560058594, -29.27018165588379, -25.488826751708984, -21.70747184753418, -17.926116943359375, -14.144763946533203, -10.363409042358398, -6.582054138183594, -2.800701141357422, 0.9806537628173828, 4.7620086669921875, 8.543363571166992, 12.32471752166748, 16.10607147216797, 19.887426376342773, 23.668781280517578, 27.45013427734375, 31.231489181518555, 35.01284408569336, 38.79419708251953, 42.57555389404297, 46.35690689086914, 50.13825988769531, 53.91961669921875, 57.70096969604492, 61.482322692871094, 65.26367950439453, 69.04503631591797, 72.82638549804688, 76.60774230957031, 80.38909912109375, 84.17045593261719, 87.9518051147461, 91.73316192626953, 95.51451110839844, 99.29586791992188, 103.07721710205078, 106.85857391357422, 110.63993072509766, 114.42127990722656, 118.20263671875, 121.98399353027344, 125.76535034179688]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 9.0, 9.0, 6.0, 5.0, 15.0, 12.0, 16.0, 20.0, 26.0, 27.0, 22.0, 36.0, 25.0, 32.0, 34.0, 46.0, 33.0, 48.0, 41.0, 41.0, 58.0, 37.0, 43.0, 45.0, 34.0, 41.0, 24.0, 19.0, 23.0, 31.0, 23.0, 17.0, 16.0, 9.0, 12.0, 18.0, 7.0, 10.0, 6.0, 10.0, 2.0, 7.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.875, -14.40771484375, -13.9404296875, -13.47314453125, -13.005859375, -12.53857421875, -12.0712890625, -11.60400390625, -11.13671875, -10.66943359375, -10.2021484375, -9.73486328125, -9.267578125, -8.80029296875, -8.3330078125, -7.86572265625, -7.3984375, -6.93115234375, -6.4638671875, -5.99658203125, -5.529296875, -5.06201171875, -4.5947265625, -4.12744140625, -3.66015625, -3.19287109375, -2.7255859375, -2.25830078125, -1.791015625, -1.32373046875, -0.8564453125, -0.38916015625, 0.078125, 0.54541015625, 1.0126953125, 1.47998046875, 1.947265625, 2.41455078125, 2.8818359375, 3.34912109375, 3.81640625, 4.28369140625, 4.7509765625, 5.21826171875, 5.685546875, 6.15283203125, 6.6201171875, 7.08740234375, 7.5546875, 8.02197265625, 8.4892578125, 8.95654296875, 9.423828125, 9.89111328125, 10.3583984375, 10.82568359375, 11.29296875, 11.76025390625, 12.2275390625, 12.69482421875, 13.162109375, 13.62939453125, 14.0966796875, 14.56396484375, 15.03125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 9.0, 8.0, 11.0, 12.0, 9.0, 24.0, 31.0, 29.0, 42.0, 74.0, 115.0, 177.0, 368.0, 667.0, 1481.0, 3067.0, 7369.0, 57033.0, 2005084.0, 2054508.0, 49853.0, 7669.0, 3068.0, 1599.0, 852.0, 481.0, 257.0, 134.0, 64.0, 46.0, 21.0, 16.0, 14.0, 15.0, 16.0, 9.0, 7.0, 8.0, 6.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-45.75, -44.3203125, -42.890625, -41.4609375, -40.03125, -38.6015625, -37.171875, -35.7421875, -34.3125, -32.8828125, -31.453125, -30.0234375, -28.59375, -27.1640625, -25.734375, -24.3046875, -22.875, -21.4453125, -20.015625, -18.5859375, -17.15625, -15.7265625, -14.296875, -12.8671875, -11.4375, -10.0078125, -8.578125, -7.1484375, -5.71875, -4.2890625, -2.859375, -1.4296875, 0.0, 1.4296875, 2.859375, 4.2890625, 5.71875, 7.1484375, 8.578125, 10.0078125, 11.4375, 12.8671875, 14.296875, 15.7265625, 17.15625, 18.5859375, 20.015625, 21.4453125, 22.875, 24.3046875, 25.734375, 27.1640625, 28.59375, 30.0234375, 31.453125, 32.8828125, 34.3125, 35.7421875, 37.171875, 38.6015625, 40.03125, 41.4609375, 42.890625, 44.3203125, 45.75]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 6.0, 7.0, 7.0, 10.0, 6.0, 16.0, 17.0, 21.0, 35.0, 66.0, 141.0, 249.0, 614.0, 995.0, 941.0, 458.0, 214.0, 108.0, 47.0, 40.0, 26.0, 21.0, 7.0, 7.0, 6.0, 6.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.0625, -49.67724609375, -48.2919921875, -46.90673828125, -45.521484375, -44.13623046875, -42.7509765625, -41.36572265625, -39.98046875, -38.59521484375, -37.2099609375, -35.82470703125, -34.439453125, -33.05419921875, -31.6689453125, -30.28369140625, -28.8984375, -27.51318359375, -26.1279296875, -24.74267578125, -23.357421875, -21.97216796875, -20.5869140625, -19.20166015625, -17.81640625, -16.43115234375, -15.0458984375, -13.66064453125, -12.275390625, -10.89013671875, -9.5048828125, -8.11962890625, -6.734375, -5.34912109375, -3.9638671875, -2.57861328125, -1.193359375, 0.19189453125, 1.5771484375, 2.96240234375, 4.34765625, 5.73291015625, 7.1181640625, 8.50341796875, 9.888671875, 11.27392578125, 12.6591796875, 14.04443359375, 15.4296875, 16.81494140625, 18.2001953125, 19.58544921875, 20.970703125, 22.35595703125, 23.7412109375, 25.12646484375, 26.51171875, 27.89697265625, 29.2822265625, 30.66748046875, 32.052734375, 33.43798828125, 34.8232421875, 36.20849609375, 37.59375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 7.0, 12.0, 21.0, 32.0, 76.0, 127.0, 232.0, 512.0, 1453.0, 8804.0, 202624.0, 3949079.0, 26727.0, 3080.0, 753.0, 359.0, 151.0, 86.0, 53.0, 26.0, 14.0, 11.0, 10.0, 8.0, 7.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-113.25, -109.091796875, -104.93359375, -100.775390625, -96.6171875, -92.458984375, -88.30078125, -84.142578125, -79.984375, -75.826171875, -71.66796875, -67.509765625, -63.3515625, -59.193359375, -55.03515625, -50.876953125, -46.71875, -42.560546875, -38.40234375, -34.244140625, -30.0859375, -25.927734375, -21.76953125, -17.611328125, -13.453125, -9.294921875, -5.13671875, -0.978515625, 3.1796875, 7.337890625, 11.49609375, 15.654296875, 19.8125, 23.970703125, 28.12890625, 32.287109375, 36.4453125, 40.603515625, 44.76171875, 48.919921875, 53.078125, 57.236328125, 61.39453125, 65.552734375, 69.7109375, 73.869140625, 78.02734375, 82.185546875, 86.34375, 90.501953125, 94.66015625, 98.818359375, 102.9765625, 107.134765625, 111.29296875, 115.451171875, 119.609375, 123.767578125, 127.92578125, 132.083984375, 136.2421875, 140.400390625, 144.55859375, 148.716796875, 152.875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 10.0, 18.0, 39.0, 86.0, 220.0, 361.0, 183.0, 61.0, 24.0, 9.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-196.1596221923828, -186.03109741210938, -175.90257263183594, -165.7740478515625, -155.64553833007812, -145.5170135498047, -135.38848876953125, -125.25997161865234, -115.1314468383789, -105.00292205810547, -94.87440490722656, -84.74588012695312, -74.61735534667969, -64.48883819580078, -54.360313415527344, -44.23179626464844, -34.103271484375, -23.974750518798828, -13.846227645874023, -3.7177047729492188, 6.410816192626953, 16.539337158203125, 26.667861938476562, 36.79637908935547, 46.924903869628906, 57.05342483520508, 67.18194580078125, 77.31047058105469, 87.43899536132812, 97.56751251220703, 107.69603729248047, 117.82455444335938, 127.95306396484375, 138.0815887451172, 148.21011352539062, 158.338623046875, 168.46714782714844, 178.59567260742188, 188.7241973876953, 198.85272216796875, 208.98123168945312, 219.10975646972656, 229.23828125, 239.36679077148438, 249.4953155517578, 259.62384033203125, 269.75238037109375, 279.8808898925781, 290.0093994140625, 300.1379089355469, 310.2664489746094, 320.39495849609375, 330.52349853515625, 340.6520080566406, 350.780517578125, 360.9090576171875, 371.03759765625, 381.1661071777344, 391.2946472167969, 401.42315673828125, 411.55169677734375, 421.6802062988281, 431.8087158203125, 441.937255859375, 452.0657653808594]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [5.0, 2.0, 2.0, 2.0, 1.0, 4.0, 5.0, 5.0, 6.0, 8.0, 6.0, 6.0, 6.0, 13.0, 14.0, 20.0, 22.0, 22.0, 28.0, 24.0, 33.0, 35.0, 23.0, 35.0, 43.0, 39.0, 31.0, 38.0, 38.0, 45.0, 45.0, 38.0, 43.0, 36.0, 30.0, 34.0, 27.0, 26.0, 26.0, 25.0, 22.0, 15.0, 14.0, 17.0, 14.0, 7.0, 9.0, 7.0, 6.0, 5.0, 2.0, 5.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-75.58731842041016, -72.9395523071289, -70.29179382324219, -67.64402770996094, -64.99626159667969, -62.34849548339844, -59.70073318481445, -57.05297088623047, -54.40520477294922, -51.75743865966797, -49.109676361083984, -46.4619140625, -43.81414794921875, -41.1663818359375, -38.518619537353516, -35.87085723876953, -33.22309112548828, -30.575326919555664, -27.927562713623047, -25.27979850769043, -22.632034301757812, -19.984270095825195, -17.336505889892578, -14.688741683959961, -12.040977478027344, -9.393213272094727, -6.745449066162109, -4.097684860229492, -1.449920654296875, 1.1978435516357422, 3.8456077575683594, 6.493371963500977, 9.141128540039062, 11.78889274597168, 14.436656951904297, 17.084421157836914, 19.73218536376953, 22.37994956970215, 25.027713775634766, 27.675477981567383, 30.3232421875, 32.97100830078125, 35.618770599365234, 38.26653289794922, 40.91429901123047, 43.56206512451172, 46.2098274230957, 48.85758972167969, 51.50535583496094, 54.15312194824219, 56.80088424682617, 59.448646545410156, 62.096412658691406, 64.74417877197266, 67.39193725585938, 70.03970336914062, 72.68746948242188, 75.33523559570312, 77.98300170898438, 80.6307601928711, 83.27852630615234, 85.9262924194336, 88.57405090332031, 91.22181701660156, 93.86958312988281]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 3.0, 7.0, 10.0, 7.0, 7.0, 17.0, 13.0, 18.0, 14.0, 27.0, 16.0, 34.0, 31.0, 37.0, 41.0, 41.0, 31.0, 36.0, 45.0, 37.0, 36.0, 46.0, 39.0, 36.0, 50.0, 24.0, 30.0, 29.0, 27.0, 23.0, 27.0, 18.0, 24.0, 19.0, 11.0, 15.0, 14.0, 10.0, 9.0, 5.0, 5.0, 3.0, 5.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.953125, -14.5069580078125, -14.060791015625, -13.6146240234375, -13.16845703125, -12.7222900390625, -12.276123046875, -11.8299560546875, -11.3837890625, -10.9376220703125, -10.491455078125, -10.0452880859375, -9.59912109375, -9.1529541015625, -8.706787109375, -8.2606201171875, -7.814453125, -7.3682861328125, -6.922119140625, -6.4759521484375, -6.02978515625, -5.5836181640625, -5.137451171875, -4.6912841796875, -4.2451171875, -3.7989501953125, -3.352783203125, -2.9066162109375, -2.46044921875, -2.0142822265625, -1.568115234375, -1.1219482421875, -0.67578125, -0.2296142578125, 0.216552734375, 0.6627197265625, 1.10888671875, 1.5550537109375, 2.001220703125, 2.4473876953125, 2.8935546875, 3.3397216796875, 3.785888671875, 4.2320556640625, 4.67822265625, 5.1243896484375, 5.570556640625, 6.0167236328125, 6.462890625, 6.9090576171875, 7.355224609375, 7.8013916015625, 8.24755859375, 8.6937255859375, 9.139892578125, 9.5860595703125, 10.0322265625, 10.4783935546875, 10.924560546875, 11.3707275390625, 11.81689453125, 12.2630615234375, 12.709228515625, 13.1553955078125, 13.6015625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 4.0, 15.0, 15.0, 25.0, 41.0, 61.0, 74.0, 107.0, 161.0, 261.0, 391.0, 631.0, 855.0, 1233.0, 1962.0, 2637.0, 3933.0, 5684.0, 8863.0, 13152.0, 19737.0, 30164.0, 47015.0, 75360.0, 127033.0, 208612.0, 193021.0, 113718.0, 68174.0, 42843.0, 27621.0, 18061.0, 11991.0, 8097.0, 5238.0, 3773.0, 2447.0, 1834.0, 1221.0, 832.0, 495.0, 364.0, 274.0, 185.0, 127.0, 67.0, 53.0, 36.0, 26.0, 12.0, 8.0, 6.0, 2.0, 4.0, 2.0], "bins": [-1.28125, -1.244537353515625, -1.20782470703125, -1.171112060546875, -1.1343994140625, -1.097686767578125, -1.06097412109375, -1.024261474609375, -0.987548828125, -0.950836181640625, -0.91412353515625, -0.877410888671875, -0.8406982421875, -0.803985595703125, -0.76727294921875, -0.730560302734375, -0.69384765625, -0.657135009765625, -0.62042236328125, -0.583709716796875, -0.5469970703125, -0.510284423828125, -0.47357177734375, -0.436859130859375, -0.400146484375, -0.363433837890625, -0.32672119140625, -0.290008544921875, -0.2532958984375, -0.216583251953125, -0.17987060546875, -0.143157958984375, -0.1064453125, -0.069732666015625, -0.03302001953125, 0.003692626953125, 0.0404052734375, 0.077117919921875, 0.11383056640625, 0.150543212890625, 0.187255859375, 0.223968505859375, 0.26068115234375, 0.297393798828125, 0.3341064453125, 0.370819091796875, 0.40753173828125, 0.444244384765625, 0.48095703125, 0.517669677734375, 0.55438232421875, 0.591094970703125, 0.6278076171875, 0.664520263671875, 0.70123291015625, 0.737945556640625, 0.774658203125, 0.811370849609375, 0.84808349609375, 0.884796142578125, 0.9215087890625, 0.958221435546875, 0.99493408203125, 1.031646728515625, 1.068359375]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 13.0, 10.0, 10.0, 19.0, 28.0, 34.0, 19.0, 33.0, 35.0, 32.0, 34.0, 43.0, 56.0, 51.0, 60.0, 1080.0, 42.0, 52.0, 41.0, 51.0, 49.0, 41.0, 49.0, 30.0, 23.0, 14.0, 15.0, 24.0, 14.0, 11.0, 7.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2890625, -11.9112548828125, -11.533447265625, -11.1556396484375, -10.77783203125, -10.4000244140625, -10.022216796875, -9.6444091796875, -9.2666015625, -8.8887939453125, -8.510986328125, -8.1331787109375, -7.75537109375, -7.3775634765625, -6.999755859375, -6.6219482421875, -6.244140625, -5.8663330078125, -5.488525390625, -5.1107177734375, -4.73291015625, -4.3551025390625, -3.977294921875, -3.5994873046875, -3.2216796875, -2.8438720703125, -2.466064453125, -2.0882568359375, -1.71044921875, -1.3326416015625, -0.954833984375, -0.5770263671875, -0.19921875, 0.1785888671875, 0.556396484375, 0.9342041015625, 1.31201171875, 1.6898193359375, 2.067626953125, 2.4454345703125, 2.8232421875, 3.2010498046875, 3.578857421875, 3.9566650390625, 4.33447265625, 4.7122802734375, 5.090087890625, 5.4678955078125, 5.845703125, 6.2235107421875, 6.601318359375, 6.9791259765625, 7.35693359375, 7.7347412109375, 8.112548828125, 8.4903564453125, 8.8681640625, 9.2459716796875, 9.623779296875, 10.0015869140625, 10.37939453125, 10.7572021484375, 11.135009765625, 11.5128173828125, 11.890625]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 7.0, 7.0, 12.0, 13.0, 19.0, 36.0, 55.0, 88.0, 133.0, 213.0, 356.0, 602.0, 993.0, 1917.0, 3483.0, 6330.0, 11965.0, 23520.0, 47769.0, 101908.0, 243795.0, 1379966.0, 143230.0, 65172.0, 31590.0, 15625.0, 8266.0, 4477.0, 2400.0, 1292.0, 744.0, 432.0, 263.0, 141.0, 116.0, 70.0, 41.0, 32.0, 26.0, 10.0, 8.0, 5.0, 8.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.822265625, -1.76568603515625, -1.7091064453125, -1.65252685546875, -1.595947265625, -1.53936767578125, -1.4827880859375, -1.42620849609375, -1.36962890625, -1.31304931640625, -1.2564697265625, -1.19989013671875, -1.143310546875, -1.08673095703125, -1.0301513671875, -0.97357177734375, -0.9169921875, -0.86041259765625, -0.8038330078125, -0.74725341796875, -0.690673828125, -0.63409423828125, -0.5775146484375, -0.52093505859375, -0.46435546875, -0.40777587890625, -0.3511962890625, -0.29461669921875, -0.238037109375, -0.18145751953125, -0.1248779296875, -0.06829833984375, -0.01171875, 0.04486083984375, 0.1014404296875, 0.15802001953125, 0.214599609375, 0.27117919921875, 0.3277587890625, 0.38433837890625, 0.44091796875, 0.49749755859375, 0.5540771484375, 0.61065673828125, 0.667236328125, 0.72381591796875, 0.7803955078125, 0.83697509765625, 0.8935546875, 0.95013427734375, 1.0067138671875, 1.06329345703125, 1.119873046875, 1.17645263671875, 1.2330322265625, 1.28961181640625, 1.34619140625, 1.40277099609375, 1.4593505859375, 1.51593017578125, 1.572509765625, 1.62908935546875, 1.6856689453125, 1.74224853515625, 1.798828125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 7.0, 6.0, 4.0, 3.0, 10.0, 10.0, 11.0, 15.0, 14.0, 12.0, 17.0, 15.0, 21.0, 24.0, 29.0, 34.0, 32.0, 32.0, 48.0, 44.0, 43.0, 46.0, 45.0, 31.0, 39.0, 42.0, 42.0, 34.0, 40.0, 23.0, 27.0, 28.0, 25.0, 25.0, 21.0, 18.0, 18.0, 12.0, 5.0, 12.0, 11.0, 4.0, 6.0, 4.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0], "bins": [-0.0025539398193359375, -0.002472132444381714, -0.0023903250694274902, -0.0023085176944732666, -0.002226710319519043, -0.0021449029445648193, -0.0020630955696105957, -0.001981288194656372, -0.0018994808197021484, -0.0018176734447479248, -0.0017358660697937012, -0.0016540586948394775, -0.001572251319885254, -0.0014904439449310303, -0.0014086365699768066, -0.001326829195022583, -0.0012450218200683594, -0.0011632144451141357, -0.0010814070701599121, -0.0009995996952056885, -0.0009177923202514648, -0.0008359849452972412, -0.0007541775703430176, -0.0006723701953887939, -0.0005905628204345703, -0.0005087554454803467, -0.00042694807052612305, -0.0003451406955718994, -0.0002633333206176758, -0.00018152594566345215, -9.971857070922852e-05, -1.7911195755004883e-05, 6.389617919921875e-05, 0.00014570355415344238, 0.00022751092910766602, 0.00030931830406188965, 0.0003911256790161133, 0.0004729330539703369, 0.0005547404289245605, 0.0006365478038787842, 0.0007183551788330078, 0.0008001625537872314, 0.0008819699287414551, 0.0009637773036956787, 0.0010455846786499023, 0.001127392053604126, 0.0012091994285583496, 0.0012910068035125732, 0.0013728141784667969, 0.0014546215534210205, 0.0015364289283752441, 0.0016182363033294678, 0.0017000436782836914, 0.001781851053237915, 0.0018636584281921387, 0.0019454658031463623, 0.002027273178100586, 0.0021090805530548096, 0.002190887928009033, 0.002272695302963257, 0.0023545026779174805, 0.002436310052871704, 0.0025181174278259277, 0.0025999248027801514, 0.002681732177734375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 8.0, 12.0, 15.0, 8.0, 10.0, 21.0, 27.0, 33.0, 39.0, 43.0, 57.0, 56.0, 64.0, 110.0, 171.0, 329.0, 1035.0, 17924.0, 965696.0, 59883.0, 1755.0, 428.0, 198.0, 125.0, 93.0, 68.0, 61.0, 56.0, 40.0, 26.0, 26.0, 26.0, 13.0, 14.0, 17.0, 15.0, 7.0, 3.0, 7.0, 7.0, 5.0, 0.0, 2.0, 2.0, 6.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0567626953125, -0.05496788024902344, -0.053173065185546875, -0.05137825012207031, -0.04958343505859375, -0.04778861999511719, -0.045993804931640625, -0.04419898986816406, -0.0424041748046875, -0.04060935974121094, -0.038814544677734375, -0.03701972961425781, -0.03522491455078125, -0.03343009948730469, -0.031635284423828125, -0.029840469360351562, -0.028045654296875, -0.026250839233398438, -0.024456024169921875, -0.022661209106445312, -0.02086639404296875, -0.019071578979492188, -0.017276763916015625, -0.015481948852539062, -0.0136871337890625, -0.011892318725585938, -0.010097503662109375, -0.008302688598632812, -0.00650787353515625, -0.0047130584716796875, -0.002918243408203125, -0.0011234283447265625, 0.00067138671875, 0.0024662017822265625, 0.004261016845703125, 0.0060558319091796875, 0.00785064697265625, 0.009645462036132812, 0.011440277099609375, 0.013235092163085938, 0.0150299072265625, 0.016824722290039062, 0.018619537353515625, 0.020414352416992188, 0.02220916748046875, 0.024003982543945312, 0.025798797607421875, 0.027593612670898438, 0.029388427734375, 0.031183242797851562, 0.032978057861328125, 0.03477287292480469, 0.03656768798828125, 0.03836250305175781, 0.040157318115234375, 0.04195213317871094, 0.0437469482421875, 0.04554176330566406, 0.047336578369140625, 0.04913139343261719, 0.05092620849609375, 0.05272102355957031, 0.054515838623046875, 0.05631065368652344, 0.05810546875]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [34.0, 566.0, 405.0, 15.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012609772384166718, -0.0006024329923093319, 5.6111253798007965e-05, 0.0007146554999053478, 0.0013731997460126877, 0.0020317439921200275, 0.0026902882382273674, 0.0033488324843347073, 0.004007376730442047, 0.004665920976549387, 0.005324465222656727, 0.005983009468764067, 0.0066415537148714066, 0.007300097960978746, 0.007958642207086086, 0.008617186918854713, 0.009275730699300766, 0.009934274479746819, 0.010592819191515446, 0.011251363903284073, 0.011909907683730125, 0.012568451464176178, 0.013226996175944805, 0.013885540887713432, 0.014544084668159485, 0.015202628448605537, 0.01586117222905159, 0.016519717872142792, 0.017178261652588844, 0.017836805433034897, 0.0184953510761261, 0.01915389485657215, 0.019812438637018204, 0.020470982417464256, 0.02112952619791031, 0.02178807184100151, 0.022446615621447563, 0.023105159401893616, 0.023763705044984818, 0.02442224882543087, 0.025080792605876923, 0.025739336386322975, 0.026397880166769028, 0.02705642580986023, 0.027714969590306282, 0.028373513370752335, 0.029032059013843536, 0.02969060279428959, 0.03034914657473564, 0.031007690355181694, 0.03166623413562775, 0.03232477977871895, 0.03298332542181015, 0.03364186733961105, 0.034300412982702255, 0.03495895490050316, 0.03561750054359436, 0.03627604618668556, 0.036934588104486465, 0.03759313374757767, 0.03825167566537857, 0.03891022130846977, 0.039568766951560974, 0.04022730886936188, 0.04088585451245308]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 6.0, 8.0, 10.0, 10.0, 18.0, 22.0, 24.0, 19.0, 25.0, 28.0, 30.0, 26.0, 41.0, 39.0, 39.0, 34.0, 38.0, 47.0, 43.0, 41.0, 41.0, 30.0, 35.0, 35.0, 30.0, 32.0, 38.0, 28.0, 31.0, 26.0, 26.0, 18.0, 15.0, 13.0, 9.0, 7.0, 8.0, 6.0, 3.0, 6.0, 4.0, 2.0, 3.0, 6.0, 1.0, 1.0, 1.0], "bins": [-0.001893460750579834, -0.0018409043550491333, -0.0017883479595184326, -0.001735791563987732, -0.0016832351684570312, -0.0016306787729263306, -0.0015781223773956299, -0.0015255659818649292, -0.0014730095863342285, -0.0014204531908035278, -0.0013678967952728271, -0.0013153403997421265, -0.0012627840042114258, -0.001210227608680725, -0.0011576712131500244, -0.0011051148176193237, -0.001052558422088623, -0.0010000020265579224, -0.0009474456310272217, -0.000894889235496521, -0.0008423328399658203, -0.0007897764444351196, -0.0007372200489044189, -0.0006846636533737183, -0.0006321072578430176, -0.0005795508623123169, -0.0005269944667816162, -0.00047443807125091553, -0.00042188167572021484, -0.00036932528018951416, -0.0003167688846588135, -0.0002642124891281128, -0.0002116560935974121, -0.00015909969806671143, -0.00010654330253601074, -5.398690700531006e-05, -1.430511474609375e-06, 5.112588405609131e-05, 0.00010368227958679199, 0.00015623867511749268, 0.00020879507064819336, 0.00026135146617889404, 0.0003139078617095947, 0.0003664642572402954, 0.0004190206527709961, 0.0004715770483016968, 0.0005241334438323975, 0.0005766898393630981, 0.0006292462348937988, 0.0006818026304244995, 0.0007343590259552002, 0.0007869154214859009, 0.0008394718170166016, 0.0008920282125473022, 0.0009445846080780029, 0.0009971410036087036, 0.0010496973991394043, 0.001102253794670105, 0.0011548101902008057, 0.0012073665857315063, 0.001259922981262207, 0.0013124793767929077, 0.0013650357723236084, 0.001417592167854309, 0.0014701485633850098]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 3.0, 7.0, 10.0, 7.0, 7.0, 17.0, 13.0, 18.0, 14.0, 27.0, 16.0, 34.0, 31.0, 37.0, 41.0, 41.0, 31.0, 36.0, 45.0, 37.0, 36.0, 46.0, 39.0, 36.0, 50.0, 24.0, 30.0, 29.0, 27.0, 23.0, 27.0, 18.0, 24.0, 19.0, 11.0, 15.0, 14.0, 10.0, 9.0, 5.0, 5.0, 3.0, 5.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.953125, -14.5069580078125, -14.060791015625, -13.6146240234375, -13.16845703125, -12.7222900390625, -12.276123046875, -11.8299560546875, -11.3837890625, -10.9376220703125, -10.491455078125, -10.0452880859375, -9.59912109375, -9.1529541015625, -8.706787109375, -8.2606201171875, -7.814453125, -7.3682861328125, -6.922119140625, -6.4759521484375, -6.02978515625, -5.5836181640625, -5.137451171875, -4.6912841796875, -4.2451171875, -3.7989501953125, -3.352783203125, -2.9066162109375, -2.46044921875, -2.0142822265625, -1.568115234375, -1.1219482421875, -0.67578125, -0.2296142578125, 0.216552734375, 0.6627197265625, 1.10888671875, 1.5550537109375, 2.001220703125, 2.4473876953125, 2.8935546875, 3.3397216796875, 3.785888671875, 4.2320556640625, 4.67822265625, 5.1243896484375, 5.570556640625, 6.0167236328125, 6.462890625, 6.9090576171875, 7.355224609375, 7.8013916015625, 8.24755859375, 8.6937255859375, 9.139892578125, 9.5860595703125, 10.0322265625, 10.4783935546875, 10.924560546875, 11.3707275390625, 11.81689453125, 12.2630615234375, 12.709228515625, 13.1553955078125, 13.6015625]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 3.0, 6.0, 4.0, 16.0, 15.0, 14.0, 21.0, 26.0, 32.0, 48.0, 86.0, 102.0, 137.0, 193.0, 276.0, 344.0, 547.0, 758.0, 1110.0, 1839.0, 2886.0, 5107.0, 10602.0, 28757.0, 130119.0, 672978.0, 138243.0, 29420.0, 11020.0, 5357.0, 2961.0, 1748.0, 1094.0, 791.0, 510.0, 334.0, 297.0, 191.0, 142.0, 102.0, 89.0, 64.0, 43.0, 36.0, 23.0, 17.0, 8.0, 11.0, 10.0, 11.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.6875, -14.249267578125, -13.81103515625, -13.372802734375, -12.9345703125, -12.496337890625, -12.05810546875, -11.619873046875, -11.181640625, -10.743408203125, -10.30517578125, -9.866943359375, -9.4287109375, -8.990478515625, -8.55224609375, -8.114013671875, -7.67578125, -7.237548828125, -6.79931640625, -6.361083984375, -5.9228515625, -5.484619140625, -5.04638671875, -4.608154296875, -4.169921875, -3.731689453125, -3.29345703125, -2.855224609375, -2.4169921875, -1.978759765625, -1.54052734375, -1.102294921875, -0.6640625, -0.225830078125, 0.21240234375, 0.650634765625, 1.0888671875, 1.527099609375, 1.96533203125, 2.403564453125, 2.841796875, 3.280029296875, 3.71826171875, 4.156494140625, 4.5947265625, 5.032958984375, 5.47119140625, 5.909423828125, 6.34765625, 6.785888671875, 7.22412109375, 7.662353515625, 8.1005859375, 8.538818359375, 8.97705078125, 9.415283203125, 9.853515625, 10.291748046875, 10.72998046875, 11.168212890625, 11.6064453125, 12.044677734375, 12.48291015625, 12.921142578125, 13.359375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 4.0, 11.0, 8.0, 11.0, 18.0, 14.0, 15.0, 14.0, 19.0, 20.0, 31.0, 26.0, 37.0, 39.0, 45.0, 52.0, 49.0, 98.0, 1720.0, 294.0, 82.0, 50.0, 50.0, 32.0, 40.0, 38.0, 41.0, 29.0, 24.0, 23.0, 30.0, 13.0, 11.0, 12.0, 7.0, 12.0, 6.0, 5.0, 1.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.375, -42.78173828125, -41.1884765625, -39.59521484375, -38.001953125, -36.40869140625, -34.8154296875, -33.22216796875, -31.62890625, -30.03564453125, -28.4423828125, -26.84912109375, -25.255859375, -23.66259765625, -22.0693359375, -20.47607421875, -18.8828125, -17.28955078125, -15.6962890625, -14.10302734375, -12.509765625, -10.91650390625, -9.3232421875, -7.72998046875, -6.13671875, -4.54345703125, -2.9501953125, -1.35693359375, 0.236328125, 1.82958984375, 3.4228515625, 5.01611328125, 6.609375, 8.20263671875, 9.7958984375, 11.38916015625, 12.982421875, 14.57568359375, 16.1689453125, 17.76220703125, 19.35546875, 20.94873046875, 22.5419921875, 24.13525390625, 25.728515625, 27.32177734375, 28.9150390625, 30.50830078125, 32.1015625, 33.69482421875, 35.2880859375, 36.88134765625, 38.474609375, 40.06787109375, 41.6611328125, 43.25439453125, 44.84765625, 46.44091796875, 48.0341796875, 49.62744140625, 51.220703125, 52.81396484375, 54.4072265625, 56.00048828125, 57.59375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 7.0, 16.0, 12.0, 23.0, 25.0, 41.0, 82.0, 161.0, 252.0, 647.0, 6758.0, 3129752.0, 6714.0, 618.0, 235.0, 144.0, 59.0, 48.0, 43.0, 20.0, 16.0, 5.0, 4.0, 1.0, 6.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-236.875, -229.5859375, -222.296875, -215.0078125, -207.71875, -200.4296875, -193.140625, -185.8515625, -178.5625, -171.2734375, -163.984375, -156.6953125, -149.40625, -142.1171875, -134.828125, -127.5390625, -120.25, -112.9609375, -105.671875, -98.3828125, -91.09375, -83.8046875, -76.515625, -69.2265625, -61.9375, -54.6484375, -47.359375, -40.0703125, -32.78125, -25.4921875, -18.203125, -10.9140625, -3.625, 3.6640625, 10.953125, 18.2421875, 25.53125, 32.8203125, 40.109375, 47.3984375, 54.6875, 61.9765625, 69.265625, 76.5546875, 83.84375, 91.1328125, 98.421875, 105.7109375, 113.0, 120.2890625, 127.578125, 134.8671875, 142.15625, 149.4453125, 156.734375, 164.0234375, 171.3125, 178.6015625, 185.890625, 193.1796875, 200.46875, 207.7578125, 215.046875, 222.3359375, 229.625]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 147.0, 729.0, 123.0, 13.0], "bins": [-518.8047485351562, -510.3590087890625, -501.91326904296875, -493.4675598144531, -485.0218200683594, -476.5760803222656, -468.1303405761719, -459.6846008300781, -451.2388916015625, -442.79315185546875, -434.347412109375, -425.9017028808594, -417.4559631347656, -409.0102233886719, -400.5644836425781, -392.1187438964844, -383.6730041503906, -375.2272644042969, -366.7815246582031, -358.3358154296875, -349.89007568359375, -341.4443359375, -332.99859619140625, -324.5528564453125, -316.10711669921875, -307.661376953125, -299.21563720703125, -290.7699279785156, -282.3241882324219, -273.8784484863281, -265.4327087402344, -256.9869689941406, -248.54129028320312, -240.09555053710938, -231.6498260498047, -223.20408630371094, -214.75836181640625, -206.3126220703125, -197.86688232421875, -189.421142578125, -180.9754180908203, -172.52967834472656, -164.08395385742188, -155.63821411132812, -147.19247436523438, -138.7467498779297, -130.30101013183594, -121.85527801513672, -113.4095458984375, -104.96381378173828, -96.51808166503906, -88.07234191894531, -79.6266098022461, -71.18087768554688, -62.73514175415039, -54.289405822753906, -45.84366989135742, -37.39793395996094, -28.95220184326172, -20.506467819213867, -12.060733795166016, -3.615001678466797, 4.8307342529296875, 13.276470184326172, 21.72220230102539]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 4.0, 6.0, 8.0, 9.0, 9.0, 11.0, 13.0, 13.0, 14.0, 18.0, 25.0, 15.0, 25.0, 24.0, 34.0, 27.0, 35.0, 38.0, 29.0, 32.0, 34.0, 52.0, 37.0, 44.0, 28.0, 47.0, 44.0, 36.0, 35.0, 29.0, 27.0, 25.0, 24.0, 21.0, 18.0, 22.0, 12.0, 15.0, 10.0, 6.0, 8.0, 10.0, 7.0, 8.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-110.14775085449219, -106.5885238647461, -103.029296875, -99.4700698852539, -95.91084289550781, -92.35162353515625, -88.79239654541016, -85.23316955566406, -81.67394256591797, -78.11471557617188, -74.55548858642578, -70.99626159667969, -67.43704223632812, -63.877811431884766, -60.31858825683594, -56.759361267089844, -53.20013427734375, -49.640907287597656, -46.08168029785156, -42.522457122802734, -38.96323013305664, -35.40400314331055, -31.844778060913086, -28.285552978515625, -24.72632598876953, -21.167098999023438, -17.607873916625977, -14.0486478805542, -10.489421844482422, -6.930194854736328, -3.370969772338867, 0.18825531005859375, 3.7474899291992188, 7.306715965270996, 10.865942001342773, 14.42516803741455, 17.984394073486328, 21.543621063232422, 25.102846145629883, 28.662071228027344, 32.22129821777344, 35.78052520751953, 39.339752197265625, 42.89897537231445, 46.45820236206055, 50.01742935180664, 53.57665252685547, 57.13587951660156, 60.695106506347656, 64.25433349609375, 67.81356048583984, 71.37278747558594, 74.9320068359375, 78.49124145507812, 82.05046081542969, 85.60968780517578, 89.16891479492188, 92.72814178466797, 96.28736877441406, 99.84659576416016, 103.40582275390625, 106.96504211425781, 110.5242691040039, 114.08349609375, 117.6427230834961]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 5.0, 1.0, 5.0, 8.0, 5.0, 8.0, 14.0, 9.0, 17.0, 16.0, 17.0, 15.0, 17.0, 26.0, 30.0, 35.0, 43.0, 28.0, 42.0, 36.0, 42.0, 31.0, 42.0, 31.0, 52.0, 33.0, 43.0, 32.0, 34.0, 19.0, 29.0, 37.0, 28.0, 15.0, 22.0, 16.0, 23.0, 9.0, 8.0, 21.0, 14.0, 9.0, 6.0, 1.0, 3.0, 5.0, 5.0, 6.0, 3.0, 1.0, 5.0, 3.0, 1.0], "bins": [-15.6640625, -15.2066650390625, -14.749267578125, -14.2918701171875, -13.83447265625, -13.3770751953125, -12.919677734375, -12.4622802734375, -12.0048828125, -11.5474853515625, -11.090087890625, -10.6326904296875, -10.17529296875, -9.7178955078125, -9.260498046875, -8.8031005859375, -8.345703125, -7.8883056640625, -7.430908203125, -6.9735107421875, -6.51611328125, -6.0587158203125, -5.601318359375, -5.1439208984375, -4.6865234375, -4.2291259765625, -3.771728515625, -3.3143310546875, -2.85693359375, -2.3995361328125, -1.942138671875, -1.4847412109375, -1.02734375, -0.5699462890625, -0.112548828125, 0.3448486328125, 0.80224609375, 1.2596435546875, 1.717041015625, 2.1744384765625, 2.6318359375, 3.0892333984375, 3.546630859375, 4.0040283203125, 4.46142578125, 4.9188232421875, 5.376220703125, 5.8336181640625, 6.291015625, 6.7484130859375, 7.205810546875, 7.6632080078125, 8.12060546875, 8.5780029296875, 9.035400390625, 9.4927978515625, 9.9501953125, 10.4075927734375, 10.864990234375, 11.3223876953125, 11.77978515625, 12.2371826171875, 12.694580078125, 13.1519775390625, 13.609375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 6.0, 6.0, 9.0, 8.0, 11.0, 17.0, 9.0, 22.0, 32.0, 26.0, 51.0, 43.0, 75.0, 70.0, 117.0, 167.0, 252.0, 413.0, 714.0, 1408.0, 3327.0, 8640.0, 91062.0, 2350805.0, 1668577.0, 54325.0, 7618.0, 2969.0, 1458.0, 747.0, 408.0, 252.0, 138.0, 104.0, 66.0, 57.0, 51.0, 50.0, 32.0, 28.0, 24.0, 23.0, 8.0, 21.0, 10.0, 7.0, 6.0, 1.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-47.59375, -46.19091796875, -44.7880859375, -43.38525390625, -41.982421875, -40.57958984375, -39.1767578125, -37.77392578125, -36.37109375, -34.96826171875, -33.5654296875, -32.16259765625, -30.759765625, -29.35693359375, -27.9541015625, -26.55126953125, -25.1484375, -23.74560546875, -22.3427734375, -20.93994140625, -19.537109375, -18.13427734375, -16.7314453125, -15.32861328125, -13.92578125, -12.52294921875, -11.1201171875, -9.71728515625, -8.314453125, -6.91162109375, -5.5087890625, -4.10595703125, -2.703125, -1.30029296875, 0.1025390625, 1.50537109375, 2.908203125, 4.31103515625, 5.7138671875, 7.11669921875, 8.51953125, 9.92236328125, 11.3251953125, 12.72802734375, 14.130859375, 15.53369140625, 16.9365234375, 18.33935546875, 19.7421875, 21.14501953125, 22.5478515625, 23.95068359375, 25.353515625, 26.75634765625, 28.1591796875, 29.56201171875, 30.96484375, 32.36767578125, 33.7705078125, 35.17333984375, 36.576171875, 37.97900390625, 39.3818359375, 40.78466796875, 42.1875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 9.0, 12.0, 21.0, 25.0, 73.0, 183.0, 377.0, 1188.0, 1282.0, 517.0, 184.0, 79.0, 47.0, 33.0, 17.0, 6.0, 8.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.8125, -54.7880859375, -52.763671875, -50.7392578125, -48.71484375, -46.6904296875, -44.666015625, -42.6416015625, -40.6171875, -38.5927734375, -36.568359375, -34.5439453125, -32.51953125, -30.4951171875, -28.470703125, -26.4462890625, -24.421875, -22.3974609375, -20.373046875, -18.3486328125, -16.32421875, -14.2998046875, -12.275390625, -10.2509765625, -8.2265625, -6.2021484375, -4.177734375, -2.1533203125, -0.12890625, 1.8955078125, 3.919921875, 5.9443359375, 7.96875, 9.9931640625, 12.017578125, 14.0419921875, 16.06640625, 18.0908203125, 20.115234375, 22.1396484375, 24.1640625, 26.1884765625, 28.212890625, 30.2373046875, 32.26171875, 34.2861328125, 36.310546875, 38.3349609375, 40.359375, 42.3837890625, 44.408203125, 46.4326171875, 48.45703125, 50.4814453125, 52.505859375, 54.5302734375, 56.5546875, 58.5791015625, 60.603515625, 62.6279296875, 64.65234375, 66.6767578125, 68.701171875, 70.7255859375, 72.75]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 7.0, 15.0, 26.0, 46.0, 100.0, 248.0, 850.0, 10028.0, 4153601.0, 27528.0, 1275.0, 339.0, 107.0, 50.0, 25.0, 11.0, 7.0, 7.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-301.75, -293.27734375, -284.8046875, -276.33203125, -267.859375, -259.38671875, -250.9140625, -242.44140625, -233.96875, -225.49609375, -217.0234375, -208.55078125, -200.078125, -191.60546875, -183.1328125, -174.66015625, -166.1875, -157.71484375, -149.2421875, -140.76953125, -132.296875, -123.82421875, -115.3515625, -106.87890625, -98.40625, -89.93359375, -81.4609375, -72.98828125, -64.515625, -56.04296875, -47.5703125, -39.09765625, -30.625, -22.15234375, -13.6796875, -5.20703125, 3.265625, 11.73828125, 20.2109375, 28.68359375, 37.15625, 45.62890625, 54.1015625, 62.57421875, 71.046875, 79.51953125, 87.9921875, 96.46484375, 104.9375, 113.41015625, 121.8828125, 130.35546875, 138.828125, 147.30078125, 155.7734375, 164.24609375, 172.71875, 181.19140625, 189.6640625, 198.13671875, 206.609375, 215.08203125, 223.5546875, 232.02734375, 240.5]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 7.0, 16.0, 24.0, 40.0, 90.0, 178.0, 275.0, 203.0, 86.0, 48.0, 22.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-273.86688232421875, -266.5318603515625, -259.1968688964844, -251.86184692382812, -244.52684020996094, -237.19183349609375, -229.85682678222656, -222.52182006835938, -215.18679809570312, -207.85179138183594, -200.51678466796875, -193.1817626953125, -185.8467559814453, -178.51174926757812, -171.17674255371094, -163.84173583984375, -156.50672912597656, -149.17172241210938, -141.8367156982422, -134.501708984375, -127.16668701171875, -119.83168029785156, -112.49667358398438, -105.16166687011719, -97.82665252685547, -90.49164581298828, -83.15663146972656, -75.82162475585938, -68.48661804199219, -61.15160369873047, -53.81659698486328, -46.48158645629883, -39.14659118652344, -31.811580657958984, -24.476572036743164, -17.141563415527344, -9.80655288696289, -2.4715423583984375, 4.86346435546875, 12.198474884033203, 19.533485412597656, 26.86849594116211, 34.20350646972656, 41.53851318359375, 48.8735237121582, 56.208534240722656, 63.543540954589844, 70.87855529785156, 78.21356201171875, 85.54856872558594, 92.88358306884766, 100.21858978271484, 107.55360412597656, 114.88861083984375, 122.22361755371094, 129.55862426757812, 136.89364624023438, 144.22865295410156, 151.56365966796875, 158.898681640625, 166.2336883544922, 173.56869506835938, 180.90370178222656, 188.23870849609375, 195.57371520996094]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 4.0, 14.0, 14.0, 20.0, 16.0, 16.0, 22.0, 26.0, 28.0, 25.0, 34.0, 36.0, 45.0, 31.0, 36.0, 37.0, 40.0, 37.0, 43.0, 41.0, 36.0, 42.0, 39.0, 36.0, 41.0, 29.0, 34.0, 30.0, 19.0, 19.0, 23.0, 18.0, 14.0, 12.0, 9.0, 4.0, 8.0, 9.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.33390808105469, -83.4459228515625, -80.55792999267578, -77.6699447631836, -74.78195190429688, -71.89396667480469, -69.0059814453125, -66.11798858642578, -63.230003356933594, -60.34201431274414, -57.45402526855469, -54.5660400390625, -51.67805099487305, -48.790061950683594, -45.90207290649414, -43.01408386230469, -40.126094818115234, -37.23810577392578, -34.35011672973633, -31.462129592895508, -28.574142456054688, -25.686153411865234, -22.79816436767578, -19.91017723083496, -17.022188186645508, -14.134200096130371, -11.246212005615234, -8.358222961425781, -5.4702348709106445, -2.582246780395508, 0.3057422637939453, 3.1937294006347656, 6.081718444824219, 8.969706535339355, 11.857694625854492, 14.745683670043945, 17.633670806884766, 20.52165985107422, 23.409648895263672, 26.297636032104492, 29.185625076293945, 32.073612213134766, 34.96160125732422, 37.84959030151367, 40.737579345703125, 43.62556457519531, 46.51355743408203, 49.40154266357422, 52.28953170776367, 55.177520751953125, 58.06550979614258, 60.95349884033203, 63.84148406982422, 66.72947692871094, 69.61746215820312, 72.50544738769531, 75.39344024658203, 78.28142547607422, 81.16941833496094, 84.05740356445312, 86.94539642333984, 89.83338165283203, 92.72137451171875, 95.60935974121094, 98.49734497070312]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 3.0, 1.0, 4.0, 3.0, 11.0, 10.0, 12.0, 19.0, 19.0, 19.0, 19.0, 24.0, 28.0, 29.0, 30.0, 49.0, 44.0, 56.0, 47.0, 45.0, 47.0, 38.0, 50.0, 47.0, 31.0, 35.0, 31.0, 30.0, 27.0, 29.0, 19.0, 32.0, 22.0, 15.0, 17.0, 14.0, 10.0, 6.0, 8.0, 4.0, 5.0, 2.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.15625, -17.6353759765625, -17.114501953125, -16.5936279296875, -16.07275390625, -15.5518798828125, -15.031005859375, -14.5101318359375, -13.9892578125, -13.4683837890625, -12.947509765625, -12.4266357421875, -11.90576171875, -11.3848876953125, -10.864013671875, -10.3431396484375, -9.822265625, -9.3013916015625, -8.780517578125, -8.2596435546875, -7.73876953125, -7.2178955078125, -6.697021484375, -6.1761474609375, -5.6552734375, -5.1343994140625, -4.613525390625, -4.0926513671875, -3.57177734375, -3.0509033203125, -2.530029296875, -2.0091552734375, -1.48828125, -0.9674072265625, -0.446533203125, 0.0743408203125, 0.59521484375, 1.1160888671875, 1.636962890625, 2.1578369140625, 2.6787109375, 3.1995849609375, 3.720458984375, 4.2413330078125, 4.76220703125, 5.2830810546875, 5.803955078125, 6.3248291015625, 6.845703125, 7.3665771484375, 7.887451171875, 8.4083251953125, 8.92919921875, 9.4500732421875, 9.970947265625, 10.4918212890625, 11.0126953125, 11.5335693359375, 12.054443359375, 12.5753173828125, 13.09619140625, 13.6170654296875, 14.137939453125, 14.6588134765625, 15.1796875]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 7.0, 19.0, 26.0, 29.0, 45.0, 71.0, 132.0, 208.0, 281.0, 545.0, 875.0, 1420.0, 2475.0, 3987.0, 6823.0, 11400.0, 20161.0, 35251.0, 66420.0, 134352.0, 278981.0, 241588.0, 113491.0, 56882.0, 30681.0, 17388.0, 10054.0, 5981.0, 3653.0, 2155.0, 1209.0, 723.0, 459.0, 295.0, 161.0, 120.0, 63.0, 55.0, 29.0, 22.0, 13.0, 10.0, 11.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.78515625, -1.730865478515625, -1.67657470703125, -1.622283935546875, -1.5679931640625, -1.513702392578125, -1.45941162109375, -1.405120849609375, -1.350830078125, -1.296539306640625, -1.24224853515625, -1.187957763671875, -1.1336669921875, -1.079376220703125, -1.02508544921875, -0.970794677734375, -0.91650390625, -0.862213134765625, -0.80792236328125, -0.753631591796875, -0.6993408203125, -0.645050048828125, -0.59075927734375, -0.536468505859375, -0.482177734375, -0.427886962890625, -0.37359619140625, -0.319305419921875, -0.2650146484375, -0.210723876953125, -0.15643310546875, -0.102142333984375, -0.0478515625, 0.006439208984375, 0.06072998046875, 0.115020751953125, 0.1693115234375, 0.223602294921875, 0.27789306640625, 0.332183837890625, 0.386474609375, 0.440765380859375, 0.49505615234375, 0.549346923828125, 0.6036376953125, 0.657928466796875, 0.71221923828125, 0.766510009765625, 0.82080078125, 0.875091552734375, 0.92938232421875, 0.983673095703125, 1.0379638671875, 1.092254638671875, 1.14654541015625, 1.200836181640625, 1.255126953125, 1.309417724609375, 1.36370849609375, 1.417999267578125, 1.4722900390625, 1.526580810546875, 1.58087158203125, 1.635162353515625, 1.689453125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 8.0, 6.0, 11.0, 7.0, 14.0, 16.0, 23.0, 12.0, 31.0, 23.0, 26.0, 30.0, 28.0, 40.0, 40.0, 40.0, 46.0, 46.0, 47.0, 1073.0, 41.0, 44.0, 56.0, 39.0, 17.0, 36.0, 37.0, 27.0, 22.0, 24.0, 26.0, 12.0, 18.0, 14.0, 8.0, 10.0, 5.0, 5.0, 5.0, 4.0, 2.0, 2.0, 3.0, 7.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.8984375, -10.5635986328125, -10.228759765625, -9.8939208984375, -9.55908203125, -9.2242431640625, -8.889404296875, -8.5545654296875, -8.2197265625, -7.8848876953125, -7.550048828125, -7.2152099609375, -6.88037109375, -6.5455322265625, -6.210693359375, -5.8758544921875, -5.541015625, -5.2061767578125, -4.871337890625, -4.5364990234375, -4.20166015625, -3.8668212890625, -3.531982421875, -3.1971435546875, -2.8623046875, -2.5274658203125, -2.192626953125, -1.8577880859375, -1.52294921875, -1.1881103515625, -0.853271484375, -0.5184326171875, -0.18359375, 0.1512451171875, 0.486083984375, 0.8209228515625, 1.15576171875, 1.4906005859375, 1.825439453125, 2.1602783203125, 2.4951171875, 2.8299560546875, 3.164794921875, 3.4996337890625, 3.83447265625, 4.1693115234375, 4.504150390625, 4.8389892578125, 5.173828125, 5.5086669921875, 5.843505859375, 6.1783447265625, 6.51318359375, 6.8480224609375, 7.182861328125, 7.5177001953125, 7.8525390625, 8.1873779296875, 8.522216796875, 8.8570556640625, 9.19189453125, 9.5267333984375, 9.861572265625, 10.1964111328125, 10.53125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 4.0, 2.0, 8.0, 8.0, 6.0, 9.0, 14.0, 16.0, 28.0, 37.0, 64.0, 65.0, 103.0, 177.0, 252.0, 405.0, 584.0, 937.0, 1427.0, 2274.0, 3642.0, 5550.0, 8970.0, 15155.0, 25535.0, 44850.0, 82298.0, 163745.0, 1341716.0, 186340.0, 91632.0, 49934.0, 28274.0, 16356.0, 9955.0, 5963.0, 3809.0, 2505.0, 1506.0, 1000.0, 684.0, 411.0, 287.0, 176.0, 128.0, 88.0, 68.0, 47.0, 28.0, 25.0, 19.0, 7.0, 8.0, 3.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.5751953125, -1.52685546875, -1.478515625, -1.43017578125, -1.3818359375, -1.33349609375, -1.28515625, -1.23681640625, -1.1884765625, -1.14013671875, -1.091796875, -1.04345703125, -0.9951171875, -0.94677734375, -0.8984375, -0.85009765625, -0.8017578125, -0.75341796875, -0.705078125, -0.65673828125, -0.6083984375, -0.56005859375, -0.51171875, -0.46337890625, -0.4150390625, -0.36669921875, -0.318359375, -0.27001953125, -0.2216796875, -0.17333984375, -0.125, -0.07666015625, -0.0283203125, 0.02001953125, 0.068359375, 0.11669921875, 0.1650390625, 0.21337890625, 0.26171875, 0.31005859375, 0.3583984375, 0.40673828125, 0.455078125, 0.50341796875, 0.5517578125, 0.60009765625, 0.6484375, 0.69677734375, 0.7451171875, 0.79345703125, 0.841796875, 0.89013671875, 0.9384765625, 0.98681640625, 1.03515625, 1.08349609375, 1.1318359375, 1.18017578125, 1.228515625, 1.27685546875, 1.3251953125, 1.37353515625, 1.421875, 1.47021484375, 1.5185546875]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 8.0, 3.0, 13.0, 12.0, 9.0, 16.0, 17.0, 22.0, 28.0, 30.0, 38.0, 34.0, 50.0, 51.0, 45.0, 61.0, 51.0, 55.0, 53.0, 56.0, 43.0, 41.0, 39.0, 37.0, 29.0, 26.0, 25.0, 18.0, 13.0, 8.0, 8.0, 11.0, 13.0, 13.0, 10.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030040740966796875, -0.0028967559337615967, -0.002789437770843506, -0.002682119607925415, -0.0025748014450073242, -0.0024674832820892334, -0.0023601651191711426, -0.0022528469562530518, -0.002145528793334961, -0.00203821063041687, -0.0019308924674987793, -0.0018235743045806885, -0.0017162561416625977, -0.0016089379787445068, -0.001501619815826416, -0.0013943016529083252, -0.0012869834899902344, -0.0011796653270721436, -0.0010723471641540527, -0.0009650290012359619, -0.0008577108383178711, -0.0007503926753997803, -0.0006430745124816895, -0.0005357563495635986, -0.0004284381866455078, -0.000321120023727417, -0.00021380186080932617, -0.00010648369789123535, 8.344650268554688e-07, 0.00010815262794494629, 0.0002154707908630371, 0.00032278895378112793, 0.00043010711669921875, 0.0005374252796173096, 0.0006447434425354004, 0.0007520616054534912, 0.000859379768371582, 0.0009666979312896729, 0.0010740160942077637, 0.0011813342571258545, 0.0012886524200439453, 0.0013959705829620361, 0.001503288745880127, 0.0016106069087982178, 0.0017179250717163086, 0.0018252432346343994, 0.0019325613975524902, 0.002039879560470581, 0.002147197723388672, 0.0022545158863067627, 0.0023618340492248535, 0.0024691522121429443, 0.002576470375061035, 0.002683788537979126, 0.002791106700897217, 0.0028984248638153076, 0.0030057430267333984, 0.0031130611896514893, 0.00322037935256958, 0.003327697515487671, 0.0034350156784057617, 0.0035423338413238525, 0.0036496520042419434, 0.003756970167160034, 0.003864288330078125]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 12.0, 11.0, 14.0, 17.0, 12.0, 14.0, 26.0, 33.0, 44.0, 54.0, 58.0, 80.0, 101.0, 145.0, 317.0, 963.0, 48984.0, 989315.0, 6972.0, 582.0, 243.0, 126.0, 99.0, 86.0, 56.0, 45.0, 38.0, 22.0, 18.0, 16.0, 11.0, 12.0, 10.0, 6.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0860595703125, -0.08369064331054688, -0.08132171630859375, -0.07895278930664062, -0.0765838623046875, -0.07421493530273438, -0.07184600830078125, -0.06947708129882812, -0.067108154296875, -0.06473922729492188, -0.06237030029296875, -0.060001373291015625, -0.0576324462890625, -0.055263519287109375, -0.05289459228515625, -0.050525665283203125, -0.04815673828125, -0.045787811279296875, -0.04341888427734375, -0.041049957275390625, -0.0386810302734375, -0.036312103271484375, -0.03394317626953125, -0.031574249267578125, -0.029205322265625, -0.026836395263671875, -0.02446746826171875, -0.022098541259765625, -0.0197296142578125, -0.017360687255859375, -0.01499176025390625, -0.012622833251953125, -0.01025390625, -0.007884979248046875, -0.00551605224609375, -0.003147125244140625, -0.0007781982421875, 0.001590728759765625, 0.00395965576171875, 0.006328582763671875, 0.008697509765625, 0.011066436767578125, 0.01343536376953125, 0.015804290771484375, 0.0181732177734375, 0.020542144775390625, 0.02291107177734375, 0.025279998779296875, 0.02764892578125, 0.030017852783203125, 0.03238677978515625, 0.034755706787109375, 0.0371246337890625, 0.039493560791015625, 0.04186248779296875, 0.044231414794921875, 0.046600341796875, 0.048969268798828125, 0.05133819580078125, 0.053707122802734375, 0.0560760498046875, 0.058444976806640625, 0.06081390380859375, 0.06318283081054688, 0.0655517578125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 9.0, 12.0, 25.0, 45.0, 122.0, 172.0, 193.0, 171.0, 139.0, 65.0, 27.0, 13.0, 11.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0049862307496368885, -0.0048604304902255535, -0.0047346302308142185, -0.004608829505741596, -0.004483029246330261, -0.004357228986918926, -0.004231428727507591, -0.004105628468096256, -0.003979828208684921, -0.0038540279492735863, -0.0037282274570316076, -0.0036024271976202726, -0.003476626705378294, -0.003350826445966959, -0.003225026186555624, -0.003099225927144289, -0.0029734252020716667, -0.0028476249426603317, -0.002721824450418353, -0.002596024191007018, -0.0024702236987650394, -0.0023444234393537045, -0.0022186231799423695, -0.0020928229205310345, -0.001967022428289056, -0.001841222052462399, -0.0017154216766357422, -0.0015896214172244072, -0.0014638210413977504, -0.0013380206655710936, -0.0012122204061597586, -0.0010864200303331017, -0.0009606201201677322, -0.0008348197443410754, -0.0007090194267220795, -0.0005832191091030836, -0.0004574187332764268, -0.00033161835744977, -0.00020581803983077407, -8.001772221177816e-05, 4.5782653614878654e-05, 0.00017158300033770502, 0.0002973833470605314, 0.00042318369378335774, 0.0005489840405061841, 0.0006747844163328409, 0.0008005847339518368, 0.0009263850515708327, 0.0010521854273974895, 0.0011779858032241464, 0.0013037861790508032, 0.0014295864384621382, 0.001555386814288795, 0.0016811871901154518, 0.0018069874495267868, 0.0019327878253534436, 0.0020585882011801004, 0.0021843884605914354, 0.002310188952833414, 0.002435989212244749, 0.002561789471656084, 0.0026875899638980627, 0.0028133902233093977, 0.0029391907155513763, 0.0030649909749627113]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 6.0, 3.0, 4.0, 11.0, 12.0, 16.0, 8.0, 17.0, 18.0, 21.0, 23.0, 24.0, 41.0, 26.0, 41.0, 40.0, 23.0, 39.0, 33.0, 44.0, 46.0, 40.0, 36.0, 46.0, 35.0, 37.0, 28.0, 40.0, 29.0, 26.0, 33.0, 27.0, 16.0, 22.0, 13.0, 11.0, 14.0, 8.0, 8.0, 9.0, 4.0, 7.0, 5.0, 3.0, 2.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018587112426757812, -0.0018023783341050148, -0.0017460454255342484, -0.001689712516963482, -0.0016333796083927155, -0.001577046699821949, -0.0015207137912511826, -0.001464380882680416, -0.0014080479741096497, -0.0013517150655388832, -0.0012953821569681168, -0.0012390492483973503, -0.0011827163398265839, -0.0011263834312558174, -0.001070050522685051, -0.0010137176141142845, -0.0009573847055435181, -0.0009010517969727516, -0.0008447188884019852, -0.0007883859798312187, -0.0007320530712604523, -0.0006757201626896858, -0.0006193872541189194, -0.0005630543455481529, -0.0005067214369773865, -0.00045038852840662, -0.0003940556198358536, -0.00033772271126508713, -0.0002813898026943207, -0.00022505689412355423, -0.00016872398555278778, -0.00011239107698202133, -5.605816841125488e-05, 2.7474015951156616e-07, 5.6607648730278015e-05, 0.00011294055730104446, 0.0001692734658718109, 0.00022560637444257736, 0.0002819392830133438, 0.00033827219158411026, 0.0003946051001548767, 0.00045093800872564316, 0.0005072709172964096, 0.0005636038258671761, 0.0006199367344379425, 0.000676269643008709, 0.0007326025515794754, 0.0007889354601502419, 0.0008452683687210083, 0.0009016012772917747, 0.0009579341858625412, 0.0010142670944333076, 0.001070600003004074, 0.0011269329115748405, 0.001183265820145607, 0.0012395987287163734, 0.00129593163728714, 0.0013522645458579063, 0.0014085974544286728, 0.0014649303629994392, 0.0015212632715702057, 0.0015775961801409721, 0.0016339290887117386, 0.001690261997282505, 0.0017465949058532715]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 4.0, 3.0, 1.0, 4.0, 3.0, 11.0, 10.0, 12.0, 19.0, 19.0, 19.0, 19.0, 24.0, 28.0, 29.0, 30.0, 49.0, 44.0, 56.0, 46.0, 46.0, 47.0, 38.0, 50.0, 47.0, 31.0, 35.0, 31.0, 30.0, 27.0, 29.0, 19.0, 32.0, 22.0, 15.0, 17.0, 14.0, 10.0, 6.0, 7.0, 5.0, 5.0, 2.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.15625, -17.6353759765625, -17.114501953125, -16.5936279296875, -16.07275390625, -15.5518798828125, -15.031005859375, -14.5101318359375, -13.9892578125, -13.4683837890625, -12.947509765625, -12.4266357421875, -11.90576171875, -11.3848876953125, -10.864013671875, -10.3431396484375, -9.822265625, -9.3013916015625, -8.780517578125, -8.2596435546875, -7.73876953125, -7.2178955078125, -6.697021484375, -6.1761474609375, -5.6552734375, -5.1343994140625, -4.613525390625, -4.0926513671875, -3.57177734375, -3.0509033203125, -2.530029296875, -2.0091552734375, -1.48828125, -0.9674072265625, -0.446533203125, 0.0743408203125, 0.59521484375, 1.1160888671875, 1.636962890625, 2.1578369140625, 2.6787109375, 3.1995849609375, 3.720458984375, 4.2413330078125, 4.76220703125, 5.2830810546875, 5.803955078125, 6.3248291015625, 6.845703125, 7.3665771484375, 7.887451171875, 8.4083251953125, 8.92919921875, 9.4500732421875, 9.970947265625, 10.4918212890625, 11.0126953125, 11.5335693359375, 12.054443359375, 12.5753173828125, 13.09619140625, 13.6170654296875, 14.137939453125, 14.6588134765625, 15.1796875]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 0.0, 8.0, 5.0, 16.0, 15.0, 17.0, 33.0, 31.0, 60.0, 87.0, 110.0, 192.0, 261.0, 432.0, 662.0, 1048.0, 1796.0, 3158.0, 5856.0, 11656.0, 25870.0, 63493.0, 182278.0, 440552.0, 191722.0, 66572.0, 26393.0, 11916.0, 6039.0, 3251.0, 1884.0, 1115.0, 698.0, 449.0, 282.0, 186.0, 141.0, 89.0, 57.0, 33.0, 21.0, 20.0, 14.0, 14.0, 16.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.59765625, -7.35662841796875, -7.1156005859375, -6.87457275390625, -6.633544921875, -6.39251708984375, -6.1514892578125, -5.91046142578125, -5.66943359375, -5.42840576171875, -5.1873779296875, -4.94635009765625, -4.705322265625, -4.46429443359375, -4.2232666015625, -3.98223876953125, -3.7412109375, -3.50018310546875, -3.2591552734375, -3.01812744140625, -2.777099609375, -2.53607177734375, -2.2950439453125, -2.05401611328125, -1.81298828125, -1.57196044921875, -1.3309326171875, -1.08990478515625, -0.848876953125, -0.60784912109375, -0.3668212890625, -0.12579345703125, 0.115234375, 0.35626220703125, 0.5972900390625, 0.83831787109375, 1.079345703125, 1.32037353515625, 1.5614013671875, 1.80242919921875, 2.04345703125, 2.28448486328125, 2.5255126953125, 2.76654052734375, 3.007568359375, 3.24859619140625, 3.4896240234375, 3.73065185546875, 3.9716796875, 4.21270751953125, 4.4537353515625, 4.69476318359375, 4.935791015625, 5.17681884765625, 5.4178466796875, 5.65887451171875, 5.89990234375, 6.14093017578125, 6.3819580078125, 6.62298583984375, 6.864013671875, 7.10504150390625, 7.3460693359375, 7.58709716796875, 7.828125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 7.0, 7.0, 5.0, 3.0, 6.0, 9.0, 9.0, 12.0, 12.0, 18.0, 14.0, 27.0, 25.0, 34.0, 31.0, 32.0, 36.0, 44.0, 39.0, 37.0, 71.0, 466.0, 1618.0, 59.0, 57.0, 60.0, 44.0, 35.0, 27.0, 32.0, 26.0, 32.0, 19.0, 19.0, 22.0, 12.0, 7.0, 5.0, 6.0, 8.0, 4.0, 3.0, 6.0, 1.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.375, -53.64697265625, -51.9189453125, -50.19091796875, -48.462890625, -46.73486328125, -45.0068359375, -43.27880859375, -41.55078125, -39.82275390625, -38.0947265625, -36.36669921875, -34.638671875, -32.91064453125, -31.1826171875, -29.45458984375, -27.7265625, -25.99853515625, -24.2705078125, -22.54248046875, -20.814453125, -19.08642578125, -17.3583984375, -15.63037109375, -13.90234375, -12.17431640625, -10.4462890625, -8.71826171875, -6.990234375, -5.26220703125, -3.5341796875, -1.80615234375, -0.078125, 1.64990234375, 3.3779296875, 5.10595703125, 6.833984375, 8.56201171875, 10.2900390625, 12.01806640625, 13.74609375, 15.47412109375, 17.2021484375, 18.93017578125, 20.658203125, 22.38623046875, 24.1142578125, 25.84228515625, 27.5703125, 29.29833984375, 31.0263671875, 32.75439453125, 34.482421875, 36.21044921875, 37.9384765625, 39.66650390625, 41.39453125, 43.12255859375, 44.8505859375, 46.57861328125, 48.306640625, 50.03466796875, 51.7626953125, 53.49072265625, 55.21875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 1.0, 5.0, 4.0, 4.0, 7.0, 10.0, 5.0, 13.0, 20.0, 29.0, 25.0, 33.0, 65.0, 51.0, 69.0, 93.0, 133.0, 167.0, 214.0, 505.0, 2503.0, 3036197.0, 102984.0, 1236.0, 373.0, 242.0, 148.0, 135.0, 85.0, 66.0, 65.0, 50.0, 43.0, 24.0, 25.0, 15.0, 12.0, 10.0, 12.0, 5.0, 2.0, 7.0, 8.0, 3.0, 5.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-131.5, -127.37109375, -123.2421875, -119.11328125, -114.984375, -110.85546875, -106.7265625, -102.59765625, -98.46875, -94.33984375, -90.2109375, -86.08203125, -81.953125, -77.82421875, -73.6953125, -69.56640625, -65.4375, -61.30859375, -57.1796875, -53.05078125, -48.921875, -44.79296875, -40.6640625, -36.53515625, -32.40625, -28.27734375, -24.1484375, -20.01953125, -15.890625, -11.76171875, -7.6328125, -3.50390625, 0.625, 4.75390625, 8.8828125, 13.01171875, 17.140625, 21.26953125, 25.3984375, 29.52734375, 33.65625, 37.78515625, 41.9140625, 46.04296875, 50.171875, 54.30078125, 58.4296875, 62.55859375, 66.6875, 70.81640625, 74.9453125, 79.07421875, 83.203125, 87.33203125, 91.4609375, 95.58984375, 99.71875, 103.84765625, 107.9765625, 112.10546875, 116.234375, 120.36328125, 124.4921875, 128.62109375, 132.75]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [3.0, 10.0, 109.0, 371.0, 394.0, 106.0, 18.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.088746070861816, -9.832451820373535, -6.576157569885254, -3.3198633193969727, -0.0635690689086914, 3.19272518157959, 6.449019432067871, 9.705313682556152, 12.961607933044434, 16.21790313720703, 19.474197387695312, 22.730491638183594, 25.986785888671875, 29.243080139160156, 32.49937438964844, 35.75566864013672, 39.011962890625, 42.26825714111328, 45.52455139160156, 48.780845642089844, 52.037139892578125, 55.293434143066406, 58.54972839355469, 61.80602264404297, 65.06231689453125, 68.31861114501953, 71.57490539550781, 74.8311996459961, 78.08749389648438, 81.34378814697266, 84.60008239746094, 87.85637664794922, 91.1126708984375, 94.36896514892578, 97.62525939941406, 100.88155364990234, 104.13784790039062, 107.3941421508789, 110.65043640136719, 113.90673065185547, 117.16302490234375, 120.41931915283203, 123.67561340332031, 126.9319076538086, 130.18820190429688, 133.44448852539062, 136.70079040527344, 139.95709228515625, 143.21337890625, 146.46966552734375, 149.72596740722656, 152.98226928710938, 156.23855590820312, 159.49484252929688, 162.7511444091797, 166.0074462890625, 169.26373291015625, 172.52001953125, 175.7763214111328, 179.03262329101562, 182.28890991210938, 185.54519653320312, 188.80149841308594, 192.05780029296875, 195.3140869140625]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 5.0, 4.0, 4.0, 8.0, 8.0, 18.0, 20.0, 15.0, 18.0, 30.0, 27.0, 32.0, 47.0, 42.0, 42.0, 51.0, 61.0, 57.0, 42.0, 48.0, 41.0, 44.0, 40.0, 40.0, 49.0, 43.0, 20.0, 21.0, 22.0, 21.0, 22.0, 7.0, 16.0, 8.0, 13.0, 4.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.9167938232422, -140.2230682373047, -135.52932739257812, -130.83560180664062, -126.14186096191406, -121.44812774658203, -116.75439453125, -112.0606689453125, -107.36692810058594, -102.6731948852539, -97.97946166992188, -93.28572845458984, -88.59199523925781, -83.89826202392578, -79.20452880859375, -74.51080322265625, -69.81707000732422, -65.12333679199219, -60.429603576660156, -55.735870361328125, -51.042137145996094, -46.34840393066406, -41.6546745300293, -36.960941314697266, -32.267208099365234, -27.573474884033203, -22.879741668701172, -18.186010360717773, -13.492277145385742, -8.798543930053711, -4.1048126220703125, 0.5889205932617188, 5.28265380859375, 9.976387023925781, 14.670119285583496, 19.36385154724121, 24.057584762573242, 28.751317977905273, 33.44504928588867, 38.1387825012207, 42.832515716552734, 47.526248931884766, 52.2199821472168, 56.91371154785156, 61.607444763183594, 66.30117797851562, 70.99491119384766, 75.68864440917969, 80.38237762451172, 85.07611083984375, 89.76984405517578, 94.46357727050781, 99.15731048583984, 103.85104370117188, 108.54476928710938, 113.23851013183594, 117.93223571777344, 122.62596893310547, 127.3197021484375, 132.013427734375, 136.70716857910156, 141.40089416503906, 146.09463500976562, 150.78836059570312, 155.4821014404297]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 7.0, 2.0, 11.0, 14.0, 16.0, 19.0, 15.0, 13.0, 21.0, 30.0, 33.0, 25.0, 37.0, 63.0, 42.0, 44.0, 41.0, 52.0, 53.0, 41.0, 44.0, 37.0, 35.0, 30.0, 35.0, 28.0, 26.0, 23.0, 30.0, 28.0, 22.0, 15.0, 15.0, 10.0, 9.0, 11.0, 3.0, 4.0, 4.0, 5.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.609375, -18.0697021484375, -17.530029296875, -16.9903564453125, -16.45068359375, -15.9110107421875, -15.371337890625, -14.8316650390625, -14.2919921875, -13.7523193359375, -13.212646484375, -12.6729736328125, -12.13330078125, -11.5936279296875, -11.053955078125, -10.5142822265625, -9.974609375, -9.4349365234375, -8.895263671875, -8.3555908203125, -7.81591796875, -7.2762451171875, -6.736572265625, -6.1968994140625, -5.6572265625, -5.1175537109375, -4.577880859375, -4.0382080078125, -3.49853515625, -2.9588623046875, -2.419189453125, -1.8795166015625, -1.33984375, -0.8001708984375, -0.260498046875, 0.2791748046875, 0.81884765625, 1.3585205078125, 1.898193359375, 2.4378662109375, 2.9775390625, 3.5172119140625, 4.056884765625, 4.5965576171875, 5.13623046875, 5.6759033203125, 6.215576171875, 6.7552490234375, 7.294921875, 7.8345947265625, 8.374267578125, 8.9139404296875, 9.45361328125, 9.9932861328125, 10.532958984375, 11.0726318359375, 11.6123046875, 12.1519775390625, 12.691650390625, 13.2313232421875, 13.77099609375, 14.3106689453125, 14.850341796875, 15.3900146484375, 15.9296875]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 6.0, 3.0, 13.0, 16.0, 22.0, 25.0, 31.0, 41.0, 59.0, 89.0, 132.0, 212.0, 371.0, 587.0, 1114.0, 2528.0, 7743.0, 165416.0, 3726214.0, 274234.0, 9503.0, 2847.0, 1273.0, 669.0, 366.0, 261.0, 164.0, 92.0, 66.0, 53.0, 27.0, 21.0, 21.0, 18.0, 8.0, 6.0, 5.0, 6.0, 6.0, 2.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-66.9375, -65.00048828125, -63.0634765625, -61.12646484375, -59.189453125, -57.25244140625, -55.3154296875, -53.37841796875, -51.44140625, -49.50439453125, -47.5673828125, -45.63037109375, -43.693359375, -41.75634765625, -39.8193359375, -37.88232421875, -35.9453125, -34.00830078125, -32.0712890625, -30.13427734375, -28.197265625, -26.26025390625, -24.3232421875, -22.38623046875, -20.44921875, -18.51220703125, -16.5751953125, -14.63818359375, -12.701171875, -10.76416015625, -8.8271484375, -6.89013671875, -4.953125, -3.01611328125, -1.0791015625, 0.85791015625, 2.794921875, 4.73193359375, 6.6689453125, 8.60595703125, 10.54296875, 12.47998046875, 14.4169921875, 16.35400390625, 18.291015625, 20.22802734375, 22.1650390625, 24.10205078125, 26.0390625, 27.97607421875, 29.9130859375, 31.85009765625, 33.787109375, 35.72412109375, 37.6611328125, 39.59814453125, 41.53515625, 43.47216796875, 45.4091796875, 47.34619140625, 49.283203125, 51.22021484375, 53.1572265625, 55.09423828125, 57.03125]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 3.0, 5.0, 8.0, 13.0, 16.0, 25.0, 36.0, 76.0, 215.0, 687.0, 1463.0, 982.0, 296.0, 121.0, 57.0, 33.0, 17.0, 10.0, 7.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.875, -40.896484375, -38.91796875, -36.939453125, -34.9609375, -32.982421875, -31.00390625, -29.025390625, -27.046875, -25.068359375, -23.08984375, -21.111328125, -19.1328125, -17.154296875, -15.17578125, -13.197265625, -11.21875, -9.240234375, -7.26171875, -5.283203125, -3.3046875, -1.326171875, 0.65234375, 2.630859375, 4.609375, 6.587890625, 8.56640625, 10.544921875, 12.5234375, 14.501953125, 16.48046875, 18.458984375, 20.4375, 22.416015625, 24.39453125, 26.373046875, 28.3515625, 30.330078125, 32.30859375, 34.287109375, 36.265625, 38.244140625, 40.22265625, 42.201171875, 44.1796875, 46.158203125, 48.13671875, 50.115234375, 52.09375, 54.072265625, 56.05078125, 58.029296875, 60.0078125, 61.986328125, 63.96484375, 65.943359375, 67.921875, 69.900390625, 71.87890625, 73.857421875, 75.8359375, 77.814453125, 79.79296875, 81.771484375, 83.75]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 6.0, 8.0, 14.0, 24.0, 61.0, 162.0, 472.0, 2648.0, 1436765.0, 2750432.0, 2855.0, 549.0, 158.0, 52.0, 32.0, 14.0, 13.0, 11.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-359.25, -350.8984375, -342.546875, -334.1953125, -325.84375, -317.4921875, -309.140625, -300.7890625, -292.4375, -284.0859375, -275.734375, -267.3828125, -259.03125, -250.6796875, -242.328125, -233.9765625, -225.625, -217.2734375, -208.921875, -200.5703125, -192.21875, -183.8671875, -175.515625, -167.1640625, -158.8125, -150.4609375, -142.109375, -133.7578125, -125.40625, -117.0546875, -108.703125, -100.3515625, -92.0, -83.6484375, -75.296875, -66.9453125, -58.59375, -50.2421875, -41.890625, -33.5390625, -25.1875, -16.8359375, -8.484375, -0.1328125, 8.21875, 16.5703125, 24.921875, 33.2734375, 41.625, 49.9765625, 58.328125, 66.6796875, 75.03125, 83.3828125, 91.734375, 100.0859375, 108.4375, 116.7890625, 125.140625, 133.4921875, 141.84375, 150.1953125, 158.546875, 166.8984375, 175.25]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 15.0, 74.0, 320.0, 466.0, 108.0, 21.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-570.9967041015625, -554.743408203125, -538.4900512695312, -522.2367553710938, -505.9834289550781, -489.7301025390625, -473.4767761230469, -457.22344970703125, -440.97015380859375, -424.7168273925781, -408.4635009765625, -392.210205078125, -375.9568786621094, -359.70355224609375, -343.4502258300781, -327.1968994140625, -310.9435729980469, -294.69024658203125, -278.4369201660156, -262.18359375, -245.9302978515625, -229.67697143554688, -213.42364501953125, -197.17031860351562, -180.91700744628906, -164.66368103027344, -148.41036987304688, -132.15704345703125, -115.90372467041016, -99.65040588378906, -83.39707946777344, -67.14376068115234, -50.890411376953125, -34.63709259033203, -18.383769989013672, -2.1304473876953125, 14.122871398925781, 30.376190185546875, 46.6295166015625, 62.882835388183594, 79.13615417480469, 95.38947296142578, 111.64279174804688, 127.8961181640625, 144.14944458007812, 160.4027557373047, 176.6560821533203, 192.90939331054688, 209.1627197265625, 225.41604614257812, 241.6693572998047, 257.92266845703125, 274.1759948730469, 290.4293212890625, 306.6826477050781, 322.93597412109375, 339.18927001953125, 355.4425964355469, 371.6959228515625, 387.94921875, 404.2025451660156, 420.45587158203125, 436.7091979980469, 452.9625244140625, 469.2158508300781]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 7.0, 7.0, 2.0, 8.0, 8.0, 16.0, 12.0, 12.0, 24.0, 19.0, 24.0, 29.0, 27.0, 26.0, 29.0, 35.0, 26.0, 28.0, 38.0, 32.0, 33.0, 38.0, 39.0, 26.0, 42.0, 34.0, 41.0, 36.0, 29.0, 34.0, 27.0, 20.0, 39.0, 21.0, 23.0, 7.0, 21.0, 11.0, 13.0, 9.0, 7.0, 8.0, 10.0, 7.0, 5.0, 3.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0], "bins": [-80.2331314086914, -77.7298583984375, -75.22657775878906, -72.72330474853516, -70.22003173828125, -67.71675109863281, -65.2134780883789, -62.710201263427734, -60.20692443847656, -57.70364761352539, -55.20037078857422, -52.69709777832031, -50.19382095336914, -47.69054412841797, -45.18727111816406, -42.68399429321289, -40.18071746826172, -37.67744064331055, -35.174163818359375, -32.67089080810547, -30.167613983154297, -27.664337158203125, -25.161062240600586, -22.657787322998047, -20.154510498046875, -17.651233673095703, -15.147958755493164, -12.644682884216309, -10.141407012939453, -7.638131141662598, -5.134855270385742, -2.631580352783203, -0.1283111572265625, 2.374964714050293, 4.878240585327148, 7.381516456604004, 9.88479232788086, 12.388068199157715, 14.89134407043457, 17.39461898803711, 19.89789581298828, 22.401172637939453, 24.904447555541992, 27.40772247314453, 29.910999298095703, 32.414276123046875, 34.91754913330078, 37.42082595825195, 39.924102783203125, 42.4273796081543, 44.93065643310547, 47.433929443359375, 49.93720626831055, 52.44048309326172, 54.943756103515625, 57.4470329284668, 59.95030975341797, 62.45358657836914, 64.95686340332031, 67.46013641357422, 69.96340942382812, 72.46669006347656, 74.96996307373047, 77.47323608398438, 79.97651672363281]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 5.0, 4.0, 5.0, 8.0, 6.0, 8.0, 10.0, 12.0, 14.0, 15.0, 27.0, 26.0, 20.0, 44.0, 36.0, 30.0, 35.0, 44.0, 49.0, 48.0, 44.0, 48.0, 46.0, 38.0, 41.0, 44.0, 36.0, 32.0, 39.0, 17.0, 24.0, 28.0, 21.0, 18.0, 16.0, 8.0, 12.0, 12.0, 10.0, 4.0, 4.0, 9.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.34375, -17.77685546875, -17.2099609375, -16.64306640625, -16.076171875, -15.50927734375, -14.9423828125, -14.37548828125, -13.80859375, -13.24169921875, -12.6748046875, -12.10791015625, -11.541015625, -10.97412109375, -10.4072265625, -9.84033203125, -9.2734375, -8.70654296875, -8.1396484375, -7.57275390625, -7.005859375, -6.43896484375, -5.8720703125, -5.30517578125, -4.73828125, -4.17138671875, -3.6044921875, -3.03759765625, -2.470703125, -1.90380859375, -1.3369140625, -0.77001953125, -0.203125, 0.36376953125, 0.9306640625, 1.49755859375, 2.064453125, 2.63134765625, 3.1982421875, 3.76513671875, 4.33203125, 4.89892578125, 5.4658203125, 6.03271484375, 6.599609375, 7.16650390625, 7.7333984375, 8.30029296875, 8.8671875, 9.43408203125, 10.0009765625, 10.56787109375, 11.134765625, 11.70166015625, 12.2685546875, 12.83544921875, 13.40234375, 13.96923828125, 14.5361328125, 15.10302734375, 15.669921875, 16.23681640625, 16.8037109375, 17.37060546875, 17.9375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [6.0, 3.0, 2.0, 5.0, 7.0, 11.0, 19.0, 27.0, 33.0, 47.0, 60.0, 94.0, 119.0, 196.0, 248.0, 360.0, 538.0, 755.0, 1044.0, 1420.0, 2057.0, 3117.0, 4516.0, 6798.0, 10347.0, 15480.0, 24099.0, 38501.0, 63764.0, 110070.0, 203242.0, 234269.0, 129826.0, 73528.0, 43888.0, 27298.0, 17349.0, 11334.0, 7453.0, 5092.0, 3509.0, 2457.0, 1659.0, 1156.0, 772.0, 607.0, 420.0, 300.0, 213.0, 159.0, 81.0, 60.0, 44.0, 45.0, 18.0, 17.0, 18.0, 6.0, 1.0, 5.0, 4.0, 2.0, 0.0, 1.0], "bins": [-1.4267578125, -1.3809356689453125, -1.335113525390625, -1.2892913818359375, -1.24346923828125, -1.1976470947265625, -1.151824951171875, -1.1060028076171875, -1.0601806640625, -1.0143585205078125, -0.968536376953125, -0.9227142333984375, -0.87689208984375, -0.8310699462890625, -0.785247802734375, -0.7394256591796875, -0.693603515625, -0.6477813720703125, -0.601959228515625, -0.5561370849609375, -0.51031494140625, -0.4644927978515625, -0.418670654296875, -0.3728485107421875, -0.3270263671875, -0.2812042236328125, -0.235382080078125, -0.1895599365234375, -0.14373779296875, -0.0979156494140625, -0.052093505859375, -0.0062713623046875, 0.03955078125, 0.0853729248046875, 0.131195068359375, 0.1770172119140625, 0.22283935546875, 0.2686614990234375, 0.314483642578125, 0.3603057861328125, 0.4061279296875, 0.4519500732421875, 0.497772216796875, 0.5435943603515625, 0.58941650390625, 0.6352386474609375, 0.681060791015625, 0.7268829345703125, 0.772705078125, 0.8185272216796875, 0.864349365234375, 0.9101715087890625, 0.95599365234375, 1.0018157958984375, 1.047637939453125, 1.0934600830078125, 1.1392822265625, 1.1851043701171875, 1.230926513671875, 1.2767486572265625, 1.32257080078125, 1.3683929443359375, 1.414215087890625, 1.4600372314453125, 1.505859375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 2.0, 10.0, 7.0, 8.0, 14.0, 13.0, 27.0, 14.0, 15.0, 18.0, 22.0, 28.0, 22.0, 31.0, 33.0, 22.0, 40.0, 26.0, 37.0, 40.0, 33.0, 1054.0, 33.0, 34.0, 44.0, 33.0, 35.0, 41.0, 27.0, 22.0, 34.0, 23.0, 21.0, 17.0, 15.0, 27.0, 8.0, 17.0, 13.0, 8.0, 7.0, 6.0, 10.0, 10.0, 6.0, 0.0, 3.0, 3.0, 3.0, 4.0], "bins": [-10.90625, -10.597900390625, -10.28955078125, -9.981201171875, -9.6728515625, -9.364501953125, -9.05615234375, -8.747802734375, -8.439453125, -8.131103515625, -7.82275390625, -7.514404296875, -7.2060546875, -6.897705078125, -6.58935546875, -6.281005859375, -5.97265625, -5.664306640625, -5.35595703125, -5.047607421875, -4.7392578125, -4.430908203125, -4.12255859375, -3.814208984375, -3.505859375, -3.197509765625, -2.88916015625, -2.580810546875, -2.2724609375, -1.964111328125, -1.65576171875, -1.347412109375, -1.0390625, -0.730712890625, -0.42236328125, -0.114013671875, 0.1943359375, 0.502685546875, 0.81103515625, 1.119384765625, 1.427734375, 1.736083984375, 2.04443359375, 2.352783203125, 2.6611328125, 2.969482421875, 3.27783203125, 3.586181640625, 3.89453125, 4.202880859375, 4.51123046875, 4.819580078125, 5.1279296875, 5.436279296875, 5.74462890625, 6.052978515625, 6.361328125, 6.669677734375, 6.97802734375, 7.286376953125, 7.5947265625, 7.903076171875, 8.21142578125, 8.519775390625, 8.828125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 4.0, 9.0, 13.0, 15.0, 24.0, 33.0, 46.0, 47.0, 84.0, 130.0, 189.0, 288.0, 406.0, 666.0, 1086.0, 1658.0, 2509.0, 4073.0, 6462.0, 10636.0, 17317.0, 28824.0, 49752.0, 92425.0, 195833.0, 1345972.0, 155176.0, 76238.0, 42522.0, 25099.0, 15062.0, 8952.0, 5601.0, 3691.0, 2259.0, 1439.0, 888.0, 564.0, 354.0, 250.0, 176.0, 111.0, 72.0, 49.0, 49.0, 26.0, 18.0, 13.0, 8.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.5126953125, -1.4611663818359375, -1.409637451171875, -1.3581085205078125, -1.30657958984375, -1.2550506591796875, -1.203521728515625, -1.1519927978515625, -1.1004638671875, -1.0489349365234375, -0.997406005859375, -0.9458770751953125, -0.89434814453125, -0.8428192138671875, -0.791290283203125, -0.7397613525390625, -0.688232421875, -0.6367034912109375, -0.585174560546875, -0.5336456298828125, -0.48211669921875, -0.4305877685546875, -0.379058837890625, -0.3275299072265625, -0.2760009765625, -0.2244720458984375, -0.172943115234375, -0.1214141845703125, -0.06988525390625, -0.0183563232421875, 0.033172607421875, 0.0847015380859375, 0.13623046875, 0.1877593994140625, 0.239288330078125, 0.2908172607421875, 0.34234619140625, 0.3938751220703125, 0.445404052734375, 0.4969329833984375, 0.5484619140625, 0.5999908447265625, 0.651519775390625, 0.7030487060546875, 0.75457763671875, 0.8061065673828125, 0.857635498046875, 0.9091644287109375, 0.960693359375, 1.0122222900390625, 1.063751220703125, 1.1152801513671875, 1.16680908203125, 1.2183380126953125, 1.269866943359375, 1.3213958740234375, 1.3729248046875, 1.4244537353515625, 1.475982666015625, 1.5275115966796875, 1.57904052734375, 1.6305694580078125, 1.682098388671875, 1.7336273193359375, 1.78515625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 10.0, 13.0, 8.0, 15.0, 18.0, 17.0, 25.0, 28.0, 34.0, 40.0, 50.0, 50.0, 39.0, 66.0, 68.0, 47.0, 51.0, 58.0, 51.0, 47.0, 34.0, 45.0, 34.0, 22.0, 18.0, 29.0, 18.0, 10.0, 11.0, 14.0, 8.0, 3.0, 6.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004108428955078125, -0.003990143537521362, -0.0038718581199645996, -0.003753572702407837, -0.0036352872848510742, -0.0035170018672943115, -0.003398716449737549, -0.003280431032180786, -0.0031621456146240234, -0.0030438601970672607, -0.002925574779510498, -0.0028072893619537354, -0.0026890039443969727, -0.00257071852684021, -0.0024524331092834473, -0.0023341476917266846, -0.002215862274169922, -0.002097576856613159, -0.0019792914390563965, -0.0018610060214996338, -0.001742720603942871, -0.0016244351863861084, -0.0015061497688293457, -0.001387864351272583, -0.0012695789337158203, -0.0011512935161590576, -0.001033008098602295, -0.0009147226810455322, -0.0007964372634887695, -0.0006781518459320068, -0.0005598664283752441, -0.00044158101081848145, -0.00032329559326171875, -0.00020501017570495605, -8.672475814819336e-05, 3.1560659408569336e-05, 0.00014984607696533203, 0.0002681314945220947, 0.0003864169120788574, 0.0005047023296356201, 0.0006229877471923828, 0.0007412731647491455, 0.0008595585823059082, 0.000977843999862671, 0.0010961294174194336, 0.0012144148349761963, 0.001332700252532959, 0.0014509856700897217, 0.0015692710876464844, 0.001687556505203247, 0.0018058419227600098, 0.0019241273403167725, 0.002042412757873535, 0.002160698175430298, 0.0022789835929870605, 0.0023972690105438232, 0.002515554428100586, 0.0026338398456573486, 0.0027521252632141113, 0.002870410680770874, 0.0029886960983276367, 0.0031069815158843994, 0.003225266933441162, 0.003343552350997925, 0.0034618377685546875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 6.0, 6.0, 9.0, 17.0, 18.0, 17.0, 27.0, 39.0, 35.0, 52.0, 75.0, 90.0, 130.0, 240.0, 592.0, 7890.0, 1008689.0, 28831.0, 867.0, 286.0, 155.0, 109.0, 107.0, 57.0, 46.0, 42.0, 33.0, 15.0, 17.0, 14.0, 11.0, 10.0, 7.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07452392578125, -0.07191944122314453, -0.06931495666503906, -0.0667104721069336, -0.06410598754882812, -0.061501502990722656, -0.05889701843261719, -0.05629253387451172, -0.05368804931640625, -0.05108356475830078, -0.04847908020019531, -0.045874595642089844, -0.043270111083984375, -0.040665626525878906, -0.03806114196777344, -0.03545665740966797, -0.0328521728515625, -0.03024768829345703, -0.027643203735351562, -0.025038719177246094, -0.022434234619140625, -0.019829750061035156, -0.017225265502929688, -0.014620780944824219, -0.01201629638671875, -0.009411811828613281, -0.0068073272705078125, -0.004202842712402344, -0.001598358154296875, 0.0010061264038085938, 0.0036106109619140625, 0.006215095520019531, 0.008819580078125, 0.011424064636230469, 0.014028549194335938, 0.016633033752441406, 0.019237518310546875, 0.021842002868652344, 0.024446487426757812, 0.02705097198486328, 0.02965545654296875, 0.03225994110107422, 0.03486442565917969, 0.037468910217285156, 0.040073394775390625, 0.042677879333496094, 0.04528236389160156, 0.04788684844970703, 0.0504913330078125, 0.05309581756591797, 0.05570030212402344, 0.058304786682128906, 0.060909271240234375, 0.06351375579833984, 0.06611824035644531, 0.06872272491455078, 0.07132720947265625, 0.07393169403076172, 0.07653617858886719, 0.07914066314697266, 0.08174514770507812, 0.0843496322631836, 0.08695411682128906, 0.08955860137939453, 0.0921630859375]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [13.0, 55.0, 180.0, 409.0, 262.0, 70.0, 21.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0010161134414374828, -0.0007364110788330436, -0.0004567087162286043, -0.00017700635362416506, 0.0001026960089802742, 0.00038239837158471346, 0.0006621007341891527, 0.0009418032132089138, 0.0012215054593980312, 0.0015012078220024705, 0.0017809101846069098, 0.002060612663626671, 0.0023403149098157883, 0.0026200171560049057, 0.002899719635024667, 0.003179422114044428, 0.0034591243602335453, 0.0037388266064226627, 0.0040185293182730675, 0.004298231564462185, 0.004577933810651302, 0.00485763605684042, 0.005137338303029537, 0.005417041014879942, 0.005696743261069059, 0.005976445507258177, 0.0062561482191085815, 0.006535850465297699, 0.006815552711486816, 0.007095254957675934, 0.007374957203865051, 0.007654659915715456, 0.007934361696243286, 0.008214063942432404, 0.008493766188621521, 0.008773468434810638, 0.009053170680999756, 0.009332873858511448, 0.009612576104700565, 0.009892278350889683, 0.0101719805970788, 0.010451682843267918, 0.010731385089457035, 0.011011087335646152, 0.011290790513157845, 0.011570492759346962, 0.01185019500553608, 0.012129897251725197, 0.012409599497914314, 0.012689301744103432, 0.01296900399029255, 0.013248706236481667, 0.013528408482670784, 0.013808111660182476, 0.014087813906371593, 0.014367516152560711, 0.014647218398749828, 0.014926920644938946, 0.015206622891128063, 0.01548632513731718, 0.015766028314828873, 0.01604573056101799, 0.016325432807207108, 0.016605135053396225, 0.016884837299585342]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 1.0, 4.0, 6.0, 4.0, 10.0, 8.0, 9.0, 13.0, 14.0, 24.0, 16.0, 24.0, 22.0, 21.0, 24.0, 35.0, 34.0, 34.0, 32.0, 35.0, 40.0, 44.0, 39.0, 34.0, 28.0, 31.0, 47.0, 26.0, 32.0, 35.0, 35.0, 28.0, 24.0, 21.0, 17.0, 21.0, 22.0, 22.0, 14.0, 16.0, 12.0, 8.0, 8.0, 7.0, 3.0, 9.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0018063783645629883, -0.0017489558085799217, -0.0016915332525968552, -0.0016341106966137886, -0.001576688140630722, -0.0015192655846476555, -0.001461843028664589, -0.0014044204726815224, -0.0013469979166984558, -0.0012895753607153893, -0.0012321528047323227, -0.0011747302487492561, -0.0011173076927661896, -0.001059885136783123, -0.0010024625808000565, -0.0009450400248169899, -0.0008876174688339233, -0.0008301949128508568, -0.0007727723568677902, -0.0007153498008847237, -0.0006579272449016571, -0.0006005046889185905, -0.000543082132935524, -0.00048565957695245743, -0.00042823702096939087, -0.0003708144649863243, -0.00031339190900325775, -0.0002559693530201912, -0.00019854679703712463, -0.00014112424105405807, -8.370168507099152e-05, -2.6279129087924957e-05, 3.11434268951416e-05, 8.856598287820816e-05, 0.00014598853886127472, 0.00020341109484434128, 0.00026083365082740784, 0.0003182562068104744, 0.00037567876279354095, 0.0004331013187766075, 0.0004905238747596741, 0.0005479464307427406, 0.0006053689867258072, 0.0006627915427088737, 0.0007202140986919403, 0.0007776366546750069, 0.0008350592106580734, 0.00089248176664114, 0.0009499043226242065, 0.001007326878607273, 0.0010647494345903397, 0.0011221719905734062, 0.0011795945465564728, 0.0012370171025395393, 0.001294439658522606, 0.0013518622145056725, 0.001409284770488739, 0.0014667073264718056, 0.0015241298824548721, 0.0015815524384379387, 0.0016389749944210052, 0.0016963975504040718, 0.0017538201063871384, 0.001811242662370205, 0.0018686652183532715]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 5.0, 4.0, 5.0, 8.0, 6.0, 8.0, 10.0, 12.0, 14.0, 15.0, 27.0, 26.0, 20.0, 44.0, 36.0, 30.0, 35.0, 44.0, 49.0, 48.0, 44.0, 48.0, 46.0, 38.0, 41.0, 44.0, 36.0, 32.0, 39.0, 17.0, 24.0, 28.0, 21.0, 18.0, 16.0, 8.0, 12.0, 12.0, 10.0, 4.0, 4.0, 9.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.34375, -17.77685546875, -17.2099609375, -16.64306640625, -16.076171875, -15.50927734375, -14.9423828125, -14.37548828125, -13.80859375, -13.24169921875, -12.6748046875, -12.10791015625, -11.541015625, -10.97412109375, -10.4072265625, -9.84033203125, -9.2734375, -8.70654296875, -8.1396484375, -7.57275390625, -7.005859375, -6.43896484375, -5.8720703125, -5.30517578125, -4.73828125, -4.17138671875, -3.6044921875, -3.03759765625, -2.470703125, -1.90380859375, -1.3369140625, -0.77001953125, -0.203125, 0.36376953125, 0.9306640625, 1.49755859375, 2.064453125, 2.63134765625, 3.1982421875, 3.76513671875, 4.33203125, 4.89892578125, 5.4658203125, 6.03271484375, 6.599609375, 7.16650390625, 7.7333984375, 8.30029296875, 8.8671875, 9.43408203125, 10.0009765625, 10.56787109375, 11.134765625, 11.70166015625, 12.2685546875, 12.83544921875, 13.40234375, 13.96923828125, 14.5361328125, 15.10302734375, 15.669921875, 16.23681640625, 16.8037109375, 17.37060546875, 17.9375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 2.0, 3.0, 6.0, 6.0, 7.0, 14.0, 11.0, 21.0, 15.0, 26.0, 37.0, 45.0, 69.0, 100.0, 116.0, 198.0, 293.0, 454.0, 839.0, 1750.0, 4384.0, 15780.0, 82790.0, 657495.0, 237780.0, 32716.0, 7969.0, 2751.0, 1173.0, 561.0, 332.0, 224.0, 161.0, 107.0, 72.0, 60.0, 48.0, 34.0, 25.0, 19.0, 22.0, 9.0, 13.0, 7.0, 4.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-19.625, -19.025634765625, -18.42626953125, -17.826904296875, -17.2275390625, -16.628173828125, -16.02880859375, -15.429443359375, -14.830078125, -14.230712890625, -13.63134765625, -13.031982421875, -12.4326171875, -11.833251953125, -11.23388671875, -10.634521484375, -10.03515625, -9.435791015625, -8.83642578125, -8.237060546875, -7.6376953125, -7.038330078125, -6.43896484375, -5.839599609375, -5.240234375, -4.640869140625, -4.04150390625, -3.442138671875, -2.8427734375, -2.243408203125, -1.64404296875, -1.044677734375, -0.4453125, 0.154052734375, 0.75341796875, 1.352783203125, 1.9521484375, 2.551513671875, 3.15087890625, 3.750244140625, 4.349609375, 4.948974609375, 5.54833984375, 6.147705078125, 6.7470703125, 7.346435546875, 7.94580078125, 8.545166015625, 9.14453125, 9.743896484375, 10.34326171875, 10.942626953125, 11.5419921875, 12.141357421875, 12.74072265625, 13.340087890625, 13.939453125, 14.538818359375, 15.13818359375, 15.737548828125, 16.3369140625, 16.936279296875, 17.53564453125, 18.135009765625, 18.734375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 5.0, 5.0, 5.0, 12.0, 6.0, 12.0, 18.0, 16.0, 17.0, 29.0, 19.0, 12.0, 29.0, 31.0, 44.0, 40.0, 52.0, 58.0, 59.0, 232.0, 1768.0, 109.0, 76.0, 51.0, 36.0, 40.0, 34.0, 33.0, 29.0, 19.0, 20.0, 27.0, 19.0, 13.0, 19.0, 15.0, 10.0, 9.0, 4.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-54.4375, -52.69775390625, -50.9580078125, -49.21826171875, -47.478515625, -45.73876953125, -43.9990234375, -42.25927734375, -40.51953125, -38.77978515625, -37.0400390625, -35.30029296875, -33.560546875, -31.82080078125, -30.0810546875, -28.34130859375, -26.6015625, -24.86181640625, -23.1220703125, -21.38232421875, -19.642578125, -17.90283203125, -16.1630859375, -14.42333984375, -12.68359375, -10.94384765625, -9.2041015625, -7.46435546875, -5.724609375, -3.98486328125, -2.2451171875, -0.50537109375, 1.234375, 2.97412109375, 4.7138671875, 6.45361328125, 8.193359375, 9.93310546875, 11.6728515625, 13.41259765625, 15.15234375, 16.89208984375, 18.6318359375, 20.37158203125, 22.111328125, 23.85107421875, 25.5908203125, 27.33056640625, 29.0703125, 30.81005859375, 32.5498046875, 34.28955078125, 36.029296875, 37.76904296875, 39.5087890625, 41.24853515625, 42.98828125, 44.72802734375, 46.4677734375, 48.20751953125, 49.947265625, 51.68701171875, 53.4267578125, 55.16650390625, 56.90625]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 6.0, 4.0, 7.0, 11.0, 16.0, 11.0, 27.0, 25.0, 31.0, 46.0, 47.0, 59.0, 74.0, 108.0, 143.0, 185.0, 280.0, 657.0, 3517.0, 2967429.0, 169509.0, 2048.0, 513.0, 258.0, 160.0, 132.0, 88.0, 49.0, 47.0, 67.0, 29.0, 30.0, 17.0, 18.0, 15.0, 15.0, 8.0, 6.0, 4.0, 6.0, 7.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.75, -111.7421875, -107.734375, -103.7265625, -99.71875, -95.7109375, -91.703125, -87.6953125, -83.6875, -79.6796875, -75.671875, -71.6640625, -67.65625, -63.6484375, -59.640625, -55.6328125, -51.625, -47.6171875, -43.609375, -39.6015625, -35.59375, -31.5859375, -27.578125, -23.5703125, -19.5625, -15.5546875, -11.546875, -7.5390625, -3.53125, 0.4765625, 4.484375, 8.4921875, 12.5, 16.5078125, 20.515625, 24.5234375, 28.53125, 32.5390625, 36.546875, 40.5546875, 44.5625, 48.5703125, 52.578125, 56.5859375, 60.59375, 64.6015625, 68.609375, 72.6171875, 76.625, 80.6328125, 84.640625, 88.6484375, 92.65625, 96.6640625, 100.671875, 104.6796875, 108.6875, 112.6953125, 116.703125, 120.7109375, 124.71875, 128.7265625, 132.734375, 136.7421875, 140.75]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 7.0, 14.0, 36.0, 110.0, 220.0, 264.0, 201.0, 86.0, 42.0, 20.0, 10.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.502197265625, -94.11457061767578, -91.72693634033203, -89.33930969238281, -86.95167541503906, -84.56404876708984, -82.17642211914062, -79.78878784179688, -77.40116119384766, -75.01353454589844, -72.62590026855469, -70.23827362060547, -67.85064697265625, -65.4630126953125, -63.07538604736328, -60.6877555847168, -58.30012512207031, -55.91249465942383, -53.524864196777344, -51.137237548828125, -48.74960708618164, -46.361976623535156, -43.97434997558594, -41.58671951293945, -39.19908905029297, -36.811458587646484, -34.423828125, -32.03620147705078, -29.648571014404297, -27.260940551757812, -24.87331199645996, -22.48568344116211, -20.098052978515625, -17.71042251586914, -15.322793960571289, -12.935164451599121, -10.547534942626953, -8.159905433654785, -5.772275924682617, -3.3846473693847656, -0.9970169067382812, 1.3906126022338867, 3.7782421112060547, 6.165871620178223, 8.55350112915039, 10.941130638122559, 13.328760147094727, 15.716388702392578, 18.104019165039062, 20.491649627685547, 22.8792781829834, 25.26690673828125, 27.654537200927734, 30.04216766357422, 32.42979431152344, 34.81742477416992, 37.205055236816406, 39.59268569946289, 41.980316162109375, 44.367942810058594, 46.75557327270508, 49.14320373535156, 51.53083038330078, 53.918460845947266, 56.30609130859375]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 11.0, 8.0, 15.0, 14.0, 16.0, 20.0, 21.0, 26.0, 27.0, 38.0, 35.0, 45.0, 46.0, 48.0, 47.0, 41.0, 58.0, 56.0, 44.0, 43.0, 36.0, 36.0, 34.0, 36.0, 24.0, 22.0, 15.0, 24.0, 23.0, 21.0, 10.0, 11.0, 8.0, 5.0, 4.0, 6.0, 7.0, 6.0, 3.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0], "bins": [-165.5044708251953, -160.8925323486328, -156.2805938720703, -151.6686553955078, -147.05673217773438, -142.44479370117188, -137.83285522460938, -133.22091674804688, -128.60897827148438, -123.99703979492188, -119.38510131835938, -114.7731704711914, -110.1612319946289, -105.5492935180664, -100.93736267089844, -96.32542419433594, -91.71348571777344, -87.10154724121094, -82.48960876464844, -77.87767791748047, -73.26573944091797, -68.65380096435547, -64.0418701171875, -59.429931640625, -54.8179931640625, -50.2060546875, -45.594120025634766, -40.98218536376953, -36.37024688720703, -31.758310317993164, -27.146373748779297, -22.534439086914062, -17.9224853515625, -13.310548782348633, -8.698612213134766, -4.086675643920898, 0.5252609252929688, 5.137197494506836, 9.749134063720703, 14.361068725585938, 18.973007202148438, 23.584943771362305, 28.196880340576172, 32.808815002441406, 37.420753479003906, 42.032691955566406, 46.64462661743164, 51.256561279296875, 55.868499755859375, 60.480438232421875, 65.09237670898438, 69.70430755615234, 74.31624603271484, 78.92818450927734, 83.54011535644531, 88.15205383300781, 92.76399230957031, 97.37593078613281, 101.98786926269531, 106.59980010986328, 111.21173858642578, 115.82367706298828, 120.43560791015625, 125.04754638671875, 129.65948486328125]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 4.0, 6.0, 5.0, 12.0, 8.0, 12.0, 11.0, 17.0, 25.0, 18.0, 38.0, 31.0, 39.0, 34.0, 36.0, 49.0, 45.0, 56.0, 46.0, 41.0, 48.0, 43.0, 52.0, 46.0, 36.0, 35.0, 33.0, 17.0, 29.0, 27.0, 17.0, 15.0, 13.0, 14.0, 5.0, 6.0, 9.0, 7.0, 6.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.953125, -19.332763671875, -18.71240234375, -18.092041015625, -17.4716796875, -16.851318359375, -16.23095703125, -15.610595703125, -14.990234375, -14.369873046875, -13.74951171875, -13.129150390625, -12.5087890625, -11.888427734375, -11.26806640625, -10.647705078125, -10.02734375, -9.406982421875, -8.78662109375, -8.166259765625, -7.5458984375, -6.925537109375, -6.30517578125, -5.684814453125, -5.064453125, -4.444091796875, -3.82373046875, -3.203369140625, -2.5830078125, -1.962646484375, -1.34228515625, -0.721923828125, -0.1015625, 0.518798828125, 1.13916015625, 1.759521484375, 2.3798828125, 3.000244140625, 3.62060546875, 4.240966796875, 4.861328125, 5.481689453125, 6.10205078125, 6.722412109375, 7.3427734375, 7.963134765625, 8.58349609375, 9.203857421875, 9.82421875, 10.444580078125, 11.06494140625, 11.685302734375, 12.3056640625, 12.926025390625, 13.54638671875, 14.166748046875, 14.787109375, 15.407470703125, 16.02783203125, 16.648193359375, 17.2685546875, 17.888916015625, 18.50927734375, 19.129638671875, 19.75]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 1.0, 7.0, 5.0, 6.0, 9.0, 8.0, 10.0, 17.0, 13.0, 23.0, 38.0, 58.0, 60.0, 95.0, 148.0, 227.0, 430.0, 869.0, 2165.0, 8759.0, 1506329.0, 2658936.0, 11445.0, 2413.0, 945.0, 477.0, 283.0, 135.0, 109.0, 75.0, 32.0, 36.0, 23.0, 23.0, 18.0, 12.0, 12.0, 6.0, 3.0, 6.0, 7.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-90.5, -87.6767578125, -84.853515625, -82.0302734375, -79.20703125, -76.3837890625, -73.560546875, -70.7373046875, -67.9140625, -65.0908203125, -62.267578125, -59.4443359375, -56.62109375, -53.7978515625, -50.974609375, -48.1513671875, -45.328125, -42.5048828125, -39.681640625, -36.8583984375, -34.03515625, -31.2119140625, -28.388671875, -25.5654296875, -22.7421875, -19.9189453125, -17.095703125, -14.2724609375, -11.44921875, -8.6259765625, -5.802734375, -2.9794921875, -0.15625, 2.6669921875, 5.490234375, 8.3134765625, 11.13671875, 13.9599609375, 16.783203125, 19.6064453125, 22.4296875, 25.2529296875, 28.076171875, 30.8994140625, 33.72265625, 36.5458984375, 39.369140625, 42.1923828125, 45.015625, 47.8388671875, 50.662109375, 53.4853515625, 56.30859375, 59.1318359375, 61.955078125, 64.7783203125, 67.6015625, 70.4248046875, 73.248046875, 76.0712890625, 78.89453125, 81.7177734375, 84.541015625, 87.3642578125, 90.1875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 10.0, 6.0, 10.0, 18.0, 11.0, 32.0, 40.0, 63.0, 134.0, 307.0, 727.0, 1257.0, 818.0, 359.0, 142.0, 46.0, 25.0, 23.0, 15.0, 14.0, 4.0, 5.0, 5.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-64.25, -62.5830078125, -60.916015625, -59.2490234375, -57.58203125, -55.9150390625, -54.248046875, -52.5810546875, -50.9140625, -49.2470703125, -47.580078125, -45.9130859375, -44.24609375, -42.5791015625, -40.912109375, -39.2451171875, -37.578125, -35.9111328125, -34.244140625, -32.5771484375, -30.91015625, -29.2431640625, -27.576171875, -25.9091796875, -24.2421875, -22.5751953125, -20.908203125, -19.2412109375, -17.57421875, -15.9072265625, -14.240234375, -12.5732421875, -10.90625, -9.2392578125, -7.572265625, -5.9052734375, -4.23828125, -2.5712890625, -0.904296875, 0.7626953125, 2.4296875, 4.0966796875, 5.763671875, 7.4306640625, 9.09765625, 10.7646484375, 12.431640625, 14.0986328125, 15.765625, 17.4326171875, 19.099609375, 20.7666015625, 22.43359375, 24.1005859375, 25.767578125, 27.4345703125, 29.1015625, 30.7685546875, 32.435546875, 34.1025390625, 35.76953125, 37.4365234375, 39.103515625, 40.7705078125, 42.4375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 5.0, 4.0, 14.0, 15.0, 24.0, 38.0, 73.0, 243.0, 832.0, 7218.0, 4039468.0, 142699.0, 2782.0, 487.0, 181.0, 83.0, 35.0, 24.0, 22.0, 9.0, 11.0, 9.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-205.625, -197.662109375, -189.69921875, -181.736328125, -173.7734375, -165.810546875, -157.84765625, -149.884765625, -141.921875, -133.958984375, -125.99609375, -118.033203125, -110.0703125, -102.107421875, -94.14453125, -86.181640625, -78.21875, -70.255859375, -62.29296875, -54.330078125, -46.3671875, -38.404296875, -30.44140625, -22.478515625, -14.515625, -6.552734375, 1.41015625, 9.373046875, 17.3359375, 25.298828125, 33.26171875, 41.224609375, 49.1875, 57.150390625, 65.11328125, 73.076171875, 81.0390625, 89.001953125, 96.96484375, 104.927734375, 112.890625, 120.853515625, 128.81640625, 136.779296875, 144.7421875, 152.705078125, 160.66796875, 168.630859375, 176.59375, 184.556640625, 192.51953125, 200.482421875, 208.4453125, 216.408203125, 224.37109375, 232.333984375, 240.296875, 248.259765625, 256.22265625, 264.185546875, 272.1484375, 280.111328125, 288.07421875, 296.037109375, 304.0]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 9.0, 12.0, 16.0, 41.0, 53.0, 103.0, 160.0, 187.0, 181.0, 103.0, 52.0, 33.0, 25.0, 16.0, 7.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-200.2373046875, -195.05848693847656, -189.87966918945312, -184.7008514404297, -179.52203369140625, -174.34323120117188, -169.16441345214844, -163.985595703125, -158.80677795410156, -153.62796020507812, -148.4491424560547, -143.27032470703125, -138.09152221679688, -132.91270446777344, -127.73388671875, -122.55506896972656, -117.37625122070312, -112.19743347167969, -107.01861572265625, -101.83980560302734, -96.6609878540039, -91.48217010498047, -86.30335998535156, -81.12454223632812, -75.94572448730469, -70.76690673828125, -65.58808898925781, -60.409278869628906, -55.23046112060547, -50.05164337158203, -44.87282943725586, -39.69401550292969, -34.51519775390625, -29.336381912231445, -24.15756607055664, -18.978750228881836, -13.799934387207031, -8.621118545532227, -3.442302703857422, 1.73651123046875, 6.9153289794921875, 12.094144821166992, 17.272960662841797, 22.4517765045166, 27.630592346191406, 32.809410095214844, 37.988224029541016, 43.16703796386719, 48.345855712890625, 53.52467346191406, 58.703487396240234, 63.882301330566406, 69.06111907958984, 74.23993682861328, 79.41874694824219, 84.59756469726562, 89.77638244628906, 94.9552001953125, 100.13401794433594, 105.31282806396484, 110.49164581298828, 115.67046356201172, 120.84927368164062, 126.02809143066406, 131.2069091796875]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 4.0, 4.0, 8.0, 8.0, 7.0, 15.0, 15.0, 18.0, 24.0, 13.0, 14.0, 15.0, 21.0, 29.0, 33.0, 22.0, 42.0, 20.0, 31.0, 26.0, 40.0, 36.0, 24.0, 37.0, 48.0, 30.0, 27.0, 37.0, 35.0, 26.0, 30.0, 27.0, 21.0, 26.0, 22.0, 13.0, 20.0, 17.0, 16.0, 17.0, 20.0, 9.0, 9.0, 7.0, 8.0, 6.0, 6.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0], "bins": [-74.56011962890625, -72.2015151977539, -69.8429183959961, -67.48431396484375, -65.1257095336914, -62.76710891723633, -60.40850830078125, -58.049903869628906, -55.69130325317383, -53.33270263671875, -50.974098205566406, -48.61549758911133, -46.25689697265625, -43.898292541503906, -41.53969192504883, -39.18109130859375, -36.822486877441406, -34.46388626098633, -32.105281829833984, -29.746681213378906, -27.388078689575195, -25.029476165771484, -22.670875549316406, -20.312273025512695, -17.953670501708984, -15.595067977905273, -13.236466407775879, -10.877864837646484, -8.519262313842773, -6.1606597900390625, -3.802058219909668, -1.4434566497802734, 0.9151535034179688, 3.2737555503845215, 5.632357597351074, 7.990959644317627, 10.34956169128418, 12.70816421508789, 15.066765785217285, 17.42536735534668, 19.78396987915039, 22.1425724029541, 24.501174926757812, 26.85977554321289, 29.2183780670166, 31.576980590820312, 33.93558120727539, 36.29418182373047, 38.65278625488281, 41.01138687133789, 43.369991302490234, 45.72859191894531, 48.087196350097656, 50.445796966552734, 52.80439758300781, 55.163002014160156, 57.521602630615234, 59.88020324707031, 62.238807678222656, 64.597412109375, 66.95600891113281, 69.31461334228516, 71.6732177734375, 74.03181457519531, 76.39041900634766]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 9.0, 7.0, 11.0, 17.0, 17.0, 15.0, 19.0, 21.0, 36.0, 41.0, 35.0, 34.0, 37.0, 52.0, 42.0, 57.0, 57.0, 45.0, 49.0, 45.0, 37.0, 44.0, 28.0, 34.0, 26.0, 33.0, 23.0, 18.0, 16.0, 15.0, 7.0, 21.0, 13.0, 7.0, 5.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-22.953125, -22.313720703125, -21.67431640625, -21.034912109375, -20.3955078125, -19.756103515625, -19.11669921875, -18.477294921875, -17.837890625, -17.198486328125, -16.55908203125, -15.919677734375, -15.2802734375, -14.640869140625, -14.00146484375, -13.362060546875, -12.72265625, -12.083251953125, -11.44384765625, -10.804443359375, -10.1650390625, -9.525634765625, -8.88623046875, -8.246826171875, -7.607421875, -6.968017578125, -6.32861328125, -5.689208984375, -5.0498046875, -4.410400390625, -3.77099609375, -3.131591796875, -2.4921875, -1.852783203125, -1.21337890625, -0.573974609375, 0.0654296875, 0.704833984375, 1.34423828125, 1.983642578125, 2.623046875, 3.262451171875, 3.90185546875, 4.541259765625, 5.1806640625, 5.820068359375, 6.45947265625, 7.098876953125, 7.73828125, 8.377685546875, 9.01708984375, 9.656494140625, 10.2958984375, 10.935302734375, 11.57470703125, 12.214111328125, 12.853515625, 13.492919921875, 14.13232421875, 14.771728515625, 15.4111328125, 16.050537109375, 16.68994140625, 17.329345703125, 17.96875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 1.0, 2.0, 13.0, 4.0, 12.0, 19.0, 24.0, 34.0, 56.0, 94.0, 136.0, 154.0, 315.0, 437.0, 652.0, 953.0, 1469.0, 2408.0, 3796.0, 6126.0, 10026.0, 16977.0, 29484.0, 53609.0, 101979.0, 211634.0, 291223.0, 146906.0, 73802.0, 39618.0, 22450.0, 12831.0, 7747.0, 5002.0, 3054.0, 1964.0, 1220.0, 791.0, 493.0, 353.0, 237.0, 135.0, 116.0, 61.0, 42.0, 36.0, 17.0, 20.0, 6.0, 12.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.9736328125, -1.912445068359375, -1.85125732421875, -1.790069580078125, -1.7288818359375, -1.667694091796875, -1.60650634765625, -1.545318603515625, -1.484130859375, -1.422943115234375, -1.36175537109375, -1.300567626953125, -1.2393798828125, -1.178192138671875, -1.11700439453125, -1.055816650390625, -0.99462890625, -0.933441162109375, -0.87225341796875, -0.811065673828125, -0.7498779296875, -0.688690185546875, -0.62750244140625, -0.566314697265625, -0.505126953125, -0.443939208984375, -0.38275146484375, -0.321563720703125, -0.2603759765625, -0.199188232421875, -0.13800048828125, -0.076812744140625, -0.015625, 0.045562744140625, 0.10675048828125, 0.167938232421875, 0.2291259765625, 0.290313720703125, 0.35150146484375, 0.412689208984375, 0.473876953125, 0.535064697265625, 0.59625244140625, 0.657440185546875, 0.7186279296875, 0.779815673828125, 0.84100341796875, 0.902191162109375, 0.96337890625, 1.024566650390625, 1.08575439453125, 1.146942138671875, 1.2081298828125, 1.269317626953125, 1.33050537109375, 1.391693115234375, 1.452880859375, 1.514068603515625, 1.57525634765625, 1.636444091796875, 1.6976318359375, 1.758819580078125, 1.82000732421875, 1.881195068359375, 1.9423828125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 4.0, 5.0, 1.0, 7.0, 6.0, 9.0, 7.0, 9.0, 12.0, 9.0, 20.0, 13.0, 20.0, 31.0, 28.0, 28.0, 36.0, 24.0, 41.0, 49.0, 32.0, 46.0, 32.0, 46.0, 1070.0, 38.0, 37.0, 45.0, 26.0, 40.0, 26.0, 26.0, 29.0, 22.0, 27.0, 24.0, 18.0, 19.0, 10.0, 11.0, 12.0, 9.0, 8.0, 2.0, 5.0, 2.0, 1.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.328125, -10.974609375, -10.62109375, -10.267578125, -9.9140625, -9.560546875, -9.20703125, -8.853515625, -8.5, -8.146484375, -7.79296875, -7.439453125, -7.0859375, -6.732421875, -6.37890625, -6.025390625, -5.671875, -5.318359375, -4.96484375, -4.611328125, -4.2578125, -3.904296875, -3.55078125, -3.197265625, -2.84375, -2.490234375, -2.13671875, -1.783203125, -1.4296875, -1.076171875, -0.72265625, -0.369140625, -0.015625, 0.337890625, 0.69140625, 1.044921875, 1.3984375, 1.751953125, 2.10546875, 2.458984375, 2.8125, 3.166015625, 3.51953125, 3.873046875, 4.2265625, 4.580078125, 4.93359375, 5.287109375, 5.640625, 5.994140625, 6.34765625, 6.701171875, 7.0546875, 7.408203125, 7.76171875, 8.115234375, 8.46875, 8.822265625, 9.17578125, 9.529296875, 9.8828125, 10.236328125, 10.58984375, 10.943359375, 11.296875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 2.0, 10.0, 12.0, 20.0, 29.0, 42.0, 57.0, 65.0, 122.0, 180.0, 241.0, 442.0, 684.0, 1061.0, 1586.0, 2517.0, 4256.0, 6785.0, 11446.0, 19248.0, 33523.0, 60038.0, 115828.0, 359468.0, 1213844.0, 119790.0, 61564.0, 34510.0, 19583.0, 11699.0, 7086.0, 4195.0, 2609.0, 1664.0, 989.0, 674.0, 405.0, 255.0, 204.0, 126.0, 81.0, 53.0, 39.0, 29.0, 16.0, 15.0, 16.0, 5.0, 6.0, 5.0, 3.0, 3.0, 2.0, 4.0], "bins": [-1.96484375, -1.9070892333984375, -1.849334716796875, -1.7915802001953125, -1.73382568359375, -1.6760711669921875, -1.618316650390625, -1.5605621337890625, -1.5028076171875, -1.4450531005859375, -1.387298583984375, -1.3295440673828125, -1.27178955078125, -1.2140350341796875, -1.156280517578125, -1.0985260009765625, -1.040771484375, -0.9830169677734375, -0.925262451171875, -0.8675079345703125, -0.80975341796875, -0.7519989013671875, -0.694244384765625, -0.6364898681640625, -0.5787353515625, -0.5209808349609375, -0.463226318359375, -0.4054718017578125, -0.34771728515625, -0.2899627685546875, -0.232208251953125, -0.1744537353515625, -0.11669921875, -0.0589447021484375, -0.001190185546875, 0.0565643310546875, 0.11431884765625, 0.1720733642578125, 0.229827880859375, 0.2875823974609375, 0.3453369140625, 0.4030914306640625, 0.460845947265625, 0.5186004638671875, 0.57635498046875, 0.6341094970703125, 0.691864013671875, 0.7496185302734375, 0.807373046875, 0.8651275634765625, 0.922882080078125, 0.9806365966796875, 1.03839111328125, 1.0961456298828125, 1.153900146484375, 1.2116546630859375, 1.2694091796875, 1.3271636962890625, 1.384918212890625, 1.4426727294921875, 1.50042724609375, 1.5581817626953125, 1.615936279296875, 1.6736907958984375, 1.7314453125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 0.0, 4.0, 1.0, 7.0, 3.0, 7.0, 3.0, 5.0, 8.0, 6.0, 7.0, 15.0, 17.0, 16.0, 22.0, 29.0, 27.0, 30.0, 42.0, 52.0, 51.0, 49.0, 60.0, 62.0, 65.0, 57.0, 51.0, 37.0, 40.0, 31.0, 27.0, 29.0, 24.0, 21.0, 23.0, 16.0, 9.0, 12.0, 4.0, 9.0, 3.0, 7.0, 2.0, 4.0, 0.0, 6.0, 2.0, 0.0, 2.0, 2.0, 5.0], "bins": [-0.005199432373046875, -0.005057871341705322, -0.0049163103103637695, -0.004774749279022217, -0.004633188247680664, -0.004491627216339111, -0.004350066184997559, -0.004208505153656006, -0.004066944122314453, -0.0039253830909729, -0.0037838220596313477, -0.003642261028289795, -0.003500699996948242, -0.0033591389656066895, -0.0032175779342651367, -0.003076016902923584, -0.0029344558715820312, -0.0027928948402404785, -0.0026513338088989258, -0.002509772777557373, -0.0023682117462158203, -0.0022266507148742676, -0.002085089683532715, -0.0019435286521911621, -0.0018019676208496094, -0.0016604065895080566, -0.001518845558166504, -0.0013772845268249512, -0.0012357234954833984, -0.0010941624641418457, -0.000952601432800293, -0.0008110404014587402, -0.0006694793701171875, -0.0005279183387756348, -0.00038635730743408203, -0.0002447962760925293, -0.00010323524475097656, 3.832578659057617e-05, 0.0001798868179321289, 0.00032144784927368164, 0.0004630088806152344, 0.0006045699119567871, 0.0007461309432983398, 0.0008876919746398926, 0.0010292530059814453, 0.001170814037322998, 0.0013123750686645508, 0.0014539361000061035, 0.0015954971313476562, 0.001737058162689209, 0.0018786191940307617, 0.0020201802253723145, 0.002161741256713867, 0.00230330228805542, 0.0024448633193969727, 0.0025864243507385254, 0.002727985382080078, 0.002869546413421631, 0.0030111074447631836, 0.0031526684761047363, 0.003294229507446289, 0.003435790538787842, 0.0035773515701293945, 0.0037189126014709473, 0.0038604736328125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 6.0, 6.0, 5.0, 9.0, 13.0, 10.0, 13.0, 19.0, 20.0, 22.0, 32.0, 38.0, 48.0, 48.0, 60.0, 102.0, 128.0, 235.0, 445.0, 2141.0, 162935.0, 875369.0, 5290.0, 617.0, 254.0, 186.0, 111.0, 86.0, 60.0, 53.0, 26.0, 27.0, 25.0, 22.0, 12.0, 14.0, 11.0, 14.0, 10.0, 5.0, 6.0, 6.0, 5.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.076416015625, -0.07360172271728516, -0.07078742980957031, -0.06797313690185547, -0.06515884399414062, -0.06234455108642578, -0.05953025817871094, -0.056715965270996094, -0.05390167236328125, -0.051087379455566406, -0.04827308654785156, -0.04545879364013672, -0.042644500732421875, -0.03983020782470703, -0.03701591491699219, -0.034201622009277344, -0.0313873291015625, -0.028573036193847656, -0.025758743286132812, -0.02294445037841797, -0.020130157470703125, -0.01731586456298828, -0.014501571655273438, -0.011687278747558594, -0.00887298583984375, -0.006058692932128906, -0.0032444000244140625, -0.00043010711669921875, 0.002384185791015625, 0.005198478698730469, 0.008012771606445312, 0.010827064514160156, 0.013641357421875, 0.016455650329589844, 0.019269943237304688, 0.02208423614501953, 0.024898529052734375, 0.02771282196044922, 0.030527114868164062, 0.033341407775878906, 0.03615570068359375, 0.038969993591308594, 0.04178428649902344, 0.04459857940673828, 0.047412872314453125, 0.05022716522216797, 0.05304145812988281, 0.055855751037597656, 0.0586700439453125, 0.061484336853027344, 0.06429862976074219, 0.06711292266845703, 0.06992721557617188, 0.07274150848388672, 0.07555580139160156, 0.0783700942993164, 0.08118438720703125, 0.0839986801147461, 0.08681297302246094, 0.08962726593017578, 0.09244155883789062, 0.09525585174560547, 0.09807014465332031, 0.10088443756103516, 0.10369873046875]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 9.0, 27.0, 116.0, 448.0, 305.0, 81.0, 17.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012333228252828121, -0.0119457533583045, -0.011558277532458305, -0.011170802637934685, -0.01078332681208849, -0.010395851917564869, -0.010008376091718674, -0.009620901197195053, -0.009233426302671432, -0.008845951408147812, -0.008458475582301617, -0.008071000687777996, -0.007683524861931801, -0.00729604996740818, -0.006908574607223272, -0.006521099247038364, -0.006133623421192169, -0.005746148061007261, -0.005358672700822353, -0.004971197806298733, -0.0045837219804525375, -0.004196247085928917, -0.003808771725744009, -0.003421296365559101, -0.003033821005374193, -0.0026463456451892853, -0.0022588702850043774, -0.001871395157650113, -0.0014839197974652052, -0.0010964444372802973, -0.000708969309926033, -0.0003214939497411251, 6.598234176635742e-05, 0.0004534576437436044, 0.0008409329457208514, 0.0012284081894904375, 0.0016158835496753454, 0.0020033589098602533, 0.0023908340372145176, 0.0027783093973994255, 0.0031657847575843334, 0.0035532601177692413, 0.003940735477954149, 0.004328210838139057, 0.004715685732662678, 0.005103161558508873, 0.005490636453032494, 0.0058781118132174015, 0.006265587173402309, 0.006653062533587217, 0.007040537893772125, 0.007428012788295746, 0.007815488614141941, 0.008202963508665562, 0.008590439334511757, 0.008977914229035378, 0.009365389123558998, 0.009752864018082619, 0.010140339843928814, 0.010527814738452435, 0.01091529056429863, 0.01130276545882225, 0.011690240353345871, 0.012077716179192066, 0.012465192005038261]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 6.0, 6.0, 6.0, 4.0, 7.0, 5.0, 9.0, 15.0, 10.0, 12.0, 16.0, 27.0, 32.0, 24.0, 37.0, 37.0, 36.0, 43.0, 39.0, 34.0, 40.0, 38.0, 36.0, 42.0, 34.0, 40.0, 35.0, 29.0, 32.0, 24.0, 28.0, 28.0, 26.0, 26.0, 28.0, 19.0, 12.0, 17.0, 15.0, 12.0, 8.0, 6.0, 7.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002292037010192871, -0.0022124405950307846, -0.002132844179868698, -0.0020532477647066116, -0.001973651349544525, -0.0018940549343824387, -0.0018144585192203522, -0.0017348621040582657, -0.0016552656888961792, -0.0015756692737340927, -0.0014960728585720062, -0.0014164764434099197, -0.0013368800282478333, -0.0012572836130857468, -0.0011776871979236603, -0.0010980907827615738, -0.0010184943675994873, -0.0009388979524374008, -0.0008593015372753143, -0.0007797051221132278, -0.0007001087069511414, -0.0006205122917890549, -0.0005409158766269684, -0.0004613194614648819, -0.0003817230463027954, -0.0003021266311407089, -0.00022253021597862244, -0.00014293380081653595, -6.333738565444946e-05, 1.6259029507637024e-05, 9.585544466972351e-05, 0.00017545185983181, 0.0002550482749938965, 0.00033464469015598297, 0.00041424110531806946, 0.0004938375204801559, 0.0005734339356422424, 0.0006530303508043289, 0.0007326267659664154, 0.0008122231811285019, 0.0008918195962905884, 0.0009714160114526749, 0.0010510124266147614, 0.0011306088417768478, 0.0012102052569389343, 0.0012898016721010208, 0.0013693980872631073, 0.0014489945024251938, 0.0015285909175872803, 0.0016081873327493668, 0.0016877837479114532, 0.0017673801630735397, 0.0018469765782356262, 0.0019265729933977127, 0.002006169408559799, 0.0020857658237218857, 0.002165362238883972, 0.0022449586540460587, 0.002324555069208145, 0.0024041514843702316, 0.002483747899532318, 0.0025633443146944046, 0.002642940729856491, 0.0027225371450185776, 0.002802133560180664]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 9.0, 7.0, 11.0, 17.0, 17.0, 15.0, 19.0, 21.0, 36.0, 41.0, 35.0, 34.0, 37.0, 52.0, 42.0, 57.0, 57.0, 45.0, 49.0, 45.0, 37.0, 44.0, 28.0, 34.0, 26.0, 33.0, 23.0, 18.0, 16.0, 15.0, 7.0, 21.0, 13.0, 7.0, 5.0, 7.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-22.953125, -22.313720703125, -21.67431640625, -21.034912109375, -20.3955078125, -19.756103515625, -19.11669921875, -18.477294921875, -17.837890625, -17.198486328125, -16.55908203125, -15.919677734375, -15.2802734375, -14.640869140625, -14.00146484375, -13.362060546875, -12.72265625, -12.083251953125, -11.44384765625, -10.804443359375, -10.1650390625, -9.525634765625, -8.88623046875, -8.246826171875, -7.607421875, -6.968017578125, -6.32861328125, -5.689208984375, -5.0498046875, -4.410400390625, -3.77099609375, -3.131591796875, -2.4921875, -1.852783203125, -1.21337890625, -0.573974609375, 0.0654296875, 0.704833984375, 1.34423828125, 1.983642578125, 2.623046875, 3.262451171875, 3.90185546875, 4.541259765625, 5.1806640625, 5.820068359375, 6.45947265625, 7.098876953125, 7.73828125, 8.377685546875, 9.01708984375, 9.656494140625, 10.2958984375, 10.935302734375, 11.57470703125, 12.214111328125, 12.853515625, 13.492919921875, 14.13232421875, 14.771728515625, 15.4111328125, 16.050537109375, 16.68994140625, 17.329345703125, 17.96875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 8.0, 8.0, 13.0, 12.0, 19.0, 20.0, 32.0, 45.0, 47.0, 91.0, 111.0, 162.0, 282.0, 456.0, 886.0, 1887.0, 5820.0, 32838.0, 768722.0, 214958.0, 15325.0, 3644.0, 1422.0, 673.0, 367.0, 195.0, 136.0, 96.0, 68.0, 55.0, 31.0, 26.0, 16.0, 25.0, 17.0, 13.0, 7.0, 8.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0], "bins": [-42.84375, -41.6474609375, -40.451171875, -39.2548828125, -38.05859375, -36.8623046875, -35.666015625, -34.4697265625, -33.2734375, -32.0771484375, -30.880859375, -29.6845703125, -28.48828125, -27.2919921875, -26.095703125, -24.8994140625, -23.703125, -22.5068359375, -21.310546875, -20.1142578125, -18.91796875, -17.7216796875, -16.525390625, -15.3291015625, -14.1328125, -12.9365234375, -11.740234375, -10.5439453125, -9.34765625, -8.1513671875, -6.955078125, -5.7587890625, -4.5625, -3.3662109375, -2.169921875, -0.9736328125, 0.22265625, 1.4189453125, 2.615234375, 3.8115234375, 5.0078125, 6.2041015625, 7.400390625, 8.5966796875, 9.79296875, 10.9892578125, 12.185546875, 13.3818359375, 14.578125, 15.7744140625, 16.970703125, 18.1669921875, 19.36328125, 20.5595703125, 21.755859375, 22.9521484375, 24.1484375, 25.3447265625, 26.541015625, 27.7373046875, 28.93359375, 30.1298828125, 31.326171875, 32.5224609375, 33.71875]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 10.0, 10.0, 11.0, 9.0, 8.0, 14.0, 20.0, 21.0, 14.0, 27.0, 30.0, 47.0, 48.0, 45.0, 46.0, 58.0, 75.0, 280.0, 1740.0, 92.0, 64.0, 48.0, 47.0, 48.0, 23.0, 41.0, 26.0, 21.0, 19.0, 17.0, 9.0, 21.0, 14.0, 13.0, 5.0, 4.0, 6.0, 1.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.625, -60.4775390625, -58.330078125, -56.1826171875, -54.03515625, -51.8876953125, -49.740234375, -47.5927734375, -45.4453125, -43.2978515625, -41.150390625, -39.0029296875, -36.85546875, -34.7080078125, -32.560546875, -30.4130859375, -28.265625, -26.1181640625, -23.970703125, -21.8232421875, -19.67578125, -17.5283203125, -15.380859375, -13.2333984375, -11.0859375, -8.9384765625, -6.791015625, -4.6435546875, -2.49609375, -0.3486328125, 1.798828125, 3.9462890625, 6.09375, 8.2412109375, 10.388671875, 12.5361328125, 14.68359375, 16.8310546875, 18.978515625, 21.1259765625, 23.2734375, 25.4208984375, 27.568359375, 29.7158203125, 31.86328125, 34.0107421875, 36.158203125, 38.3056640625, 40.453125, 42.6005859375, 44.748046875, 46.8955078125, 49.04296875, 51.1904296875, 53.337890625, 55.4853515625, 57.6328125, 59.7802734375, 61.927734375, 64.0751953125, 66.22265625, 68.3701171875, 70.517578125, 72.6650390625, 74.8125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 7.0, 5.0, 7.0, 13.0, 10.0, 16.0, 17.0, 22.0, 22.0, 24.0, 33.0, 52.0, 51.0, 85.0, 123.0, 201.0, 432.0, 2848.0, 3093018.0, 46721.0, 1065.0, 300.0, 178.0, 98.0, 80.0, 65.0, 36.0, 32.0, 17.0, 23.0, 23.0, 15.0, 8.0, 11.0, 10.0, 10.0, 12.0, 4.0, 5.0, 0.0, 4.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-225.625, -219.140625, -212.65625, -206.171875, -199.6875, -193.203125, -186.71875, -180.234375, -173.75, -167.265625, -160.78125, -154.296875, -147.8125, -141.328125, -134.84375, -128.359375, -121.875, -115.390625, -108.90625, -102.421875, -95.9375, -89.453125, -82.96875, -76.484375, -70.0, -63.515625, -57.03125, -50.546875, -44.0625, -37.578125, -31.09375, -24.609375, -18.125, -11.640625, -5.15625, 1.328125, 7.8125, 14.296875, 20.78125, 27.265625, 33.75, 40.234375, 46.71875, 53.203125, 59.6875, 66.171875, 72.65625, 79.140625, 85.625, 92.109375, 98.59375, 105.078125, 111.5625, 118.046875, 124.53125, 131.015625, 137.5, 143.984375, 150.46875, 156.953125, 163.4375, 169.921875, 176.40625, 182.890625, 189.375]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 35.0, 258.0, 542.0, 152.0, 21.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-261.8152160644531, -256.283935546875, -250.75267028808594, -245.2213897705078, -239.69012451171875, -234.15884399414062, -228.6275634765625, -223.09629821777344, -217.56503295898438, -212.03375244140625, -206.5024871826172, -200.97120666503906, -195.43994140625, -189.90866088867188, -184.37738037109375, -178.8461151123047, -173.31483459472656, -167.78355407714844, -162.25228881835938, -156.72100830078125, -151.1897430419922, -145.65846252441406, -140.127197265625, -134.59591674804688, -129.06463623046875, -123.53336334228516, -118.00209045410156, -112.47080993652344, -106.93954467773438, -101.40826416015625, -95.87699127197266, -90.34571838378906, -84.814453125, -79.2831802368164, -73.75190734863281, -68.22062683105469, -62.68935775756836, -57.158084869384766, -51.626808166503906, -46.09553527832031, -40.56426239013672, -35.032989501953125, -29.5017147064209, -23.970439910888672, -18.439167022705078, -12.907894134521484, -7.376617431640625, -1.8453445434570312, 3.6859283447265625, 9.217202186584473, 14.748476028442383, 20.27975082397461, 25.811023712158203, 31.342296600341797, 36.873573303222656, 42.40484619140625, 47.936119079589844, 53.46739196777344, 58.99866485595703, 64.52993774414062, 70.06121826171875, 75.59248352050781, 81.12376403808594, 86.65503692626953, 92.18630981445312]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 0.0, 1.0, 3.0, 3.0, 7.0, 7.0, 14.0, 19.0, 9.0, 12.0, 17.0, 17.0, 21.0, 19.0, 24.0, 34.0, 40.0, 38.0, 32.0, 39.0, 45.0, 45.0, 39.0, 48.0, 37.0, 39.0, 45.0, 39.0, 29.0, 41.0, 38.0, 32.0, 19.0, 21.0, 30.0, 16.0, 19.0, 15.0, 9.0, 12.0, 7.0, 9.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-177.72073364257812, -172.51834106445312, -167.31593322753906, -162.113525390625, -156.9111328125, -151.708740234375, -146.50633239746094, -141.30392456054688, -136.10153198242188, -130.89913940429688, -125.69673156738281, -120.49433135986328, -115.29193115234375, -110.08953094482422, -104.88713073730469, -99.68473052978516, -94.48233032226562, -89.2799301147461, -84.07752990722656, -78.87512969970703, -73.6727294921875, -68.47032928466797, -63.26792907714844, -58.065528869628906, -52.863128662109375, -47.660728454589844, -42.45832824707031, -37.25592803955078, -32.05352783203125, -26.85112762451172, -21.648727416992188, -16.446327209472656, -11.243927001953125, -6.041526794433594, -0.8391265869140625, 4.363273620605469, 9.565673828125, 14.768074035644531, 19.970474243164062, 25.172874450683594, 30.375274658203125, 35.577674865722656, 40.78007507324219, 45.98247528076172, 51.18487548828125, 56.38727569580078, 61.58967590332031, 66.79207611083984, 71.99447631835938, 77.1968765258789, 82.39927673339844, 87.60167694091797, 92.8040771484375, 98.00647735595703, 103.20887756347656, 108.4112777709961, 113.61367797851562, 118.81607818603516, 124.01847839355469, 129.22088623046875, 134.42327880859375, 139.62567138671875, 144.8280792236328, 150.03048706054688, 155.23287963867188]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 8.0, 5.0, 8.0, 4.0, 13.0, 12.0, 8.0, 17.0, 28.0, 22.0, 24.0, 30.0, 33.0, 32.0, 33.0, 50.0, 55.0, 45.0, 45.0, 53.0, 35.0, 48.0, 44.0, 39.0, 34.0, 29.0, 39.0, 31.0, 26.0, 21.0, 24.0, 23.0, 13.0, 17.0, 10.0, 15.0, 3.0, 11.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0], "bins": [-23.390625, -22.739501953125, -22.08837890625, -21.437255859375, -20.7861328125, -20.135009765625, -19.48388671875, -18.832763671875, -18.181640625, -17.530517578125, -16.87939453125, -16.228271484375, -15.5771484375, -14.926025390625, -14.27490234375, -13.623779296875, -12.97265625, -12.321533203125, -11.67041015625, -11.019287109375, -10.3681640625, -9.717041015625, -9.06591796875, -8.414794921875, -7.763671875, -7.112548828125, -6.46142578125, -5.810302734375, -5.1591796875, -4.508056640625, -3.85693359375, -3.205810546875, -2.5546875, -1.903564453125, -1.25244140625, -0.601318359375, 0.0498046875, 0.700927734375, 1.35205078125, 2.003173828125, 2.654296875, 3.305419921875, 3.95654296875, 4.607666015625, 5.2587890625, 5.909912109375, 6.56103515625, 7.212158203125, 7.86328125, 8.514404296875, 9.16552734375, 9.816650390625, 10.4677734375, 11.118896484375, 11.77001953125, 12.421142578125, 13.072265625, 13.723388671875, 14.37451171875, 15.025634765625, 15.6767578125, 16.327880859375, 16.97900390625, 17.630126953125, 18.28125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 8.0, 5.0, 15.0, 12.0, 22.0, 30.0, 52.0, 58.0, 78.0, 105.0, 167.0, 272.0, 414.0, 731.0, 1262.0, 2522.0, 5364.0, 16154.0, 216010.0, 2563632.0, 1296000.0, 71477.0, 10759.0, 4130.0, 2106.0, 1103.0, 624.0, 389.0, 236.0, 151.0, 97.0, 85.0, 51.0, 34.0, 29.0, 29.0, 19.0, 6.0, 8.0, 10.0, 6.0, 2.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-48.5625, -47.16796875, -45.7734375, -44.37890625, -42.984375, -41.58984375, -40.1953125, -38.80078125, -37.40625, -36.01171875, -34.6171875, -33.22265625, -31.828125, -30.43359375, -29.0390625, -27.64453125, -26.25, -24.85546875, -23.4609375, -22.06640625, -20.671875, -19.27734375, -17.8828125, -16.48828125, -15.09375, -13.69921875, -12.3046875, -10.91015625, -9.515625, -8.12109375, -6.7265625, -5.33203125, -3.9375, -2.54296875, -1.1484375, 0.24609375, 1.640625, 3.03515625, 4.4296875, 5.82421875, 7.21875, 8.61328125, 10.0078125, 11.40234375, 12.796875, 14.19140625, 15.5859375, 16.98046875, 18.375, 19.76953125, 21.1640625, 22.55859375, 23.953125, 25.34765625, 26.7421875, 28.13671875, 29.53125, 30.92578125, 32.3203125, 33.71484375, 35.109375, 36.50390625, 37.8984375, 39.29296875, 40.6875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 2.0, 5.0, 7.0, 11.0, 14.0, 24.0, 31.0, 39.0, 61.0, 106.0, 247.0, 541.0, 1038.0, 998.0, 482.0, 199.0, 94.0, 60.0, 30.0, 27.0, 18.0, 12.0, 11.0, 2.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.375, -33.6015625, -31.828125, -30.0546875, -28.28125, -26.5078125, -24.734375, -22.9609375, -21.1875, -19.4140625, -17.640625, -15.8671875, -14.09375, -12.3203125, -10.546875, -8.7734375, -7.0, -5.2265625, -3.453125, -1.6796875, 0.09375, 1.8671875, 3.640625, 5.4140625, 7.1875, 8.9609375, 10.734375, 12.5078125, 14.28125, 16.0546875, 17.828125, 19.6015625, 21.375, 23.1484375, 24.921875, 26.6953125, 28.46875, 30.2421875, 32.015625, 33.7890625, 35.5625, 37.3359375, 39.109375, 40.8828125, 42.65625, 44.4296875, 46.203125, 47.9765625, 49.75, 51.5234375, 53.296875, 55.0703125, 56.84375, 58.6171875, 60.390625, 62.1640625, 63.9375, 65.7109375, 67.484375, 69.2578125, 71.03125, 72.8046875, 74.578125, 76.3515625, 78.125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 4.0, 8.0, 19.0, 28.0, 44.0, 94.0, 187.0, 443.0, 1523.0, 9538.0, 454503.0, 3707629.0, 16900.0, 2263.0, 581.0, 243.0, 102.0, 65.0, 39.0, 21.0, 12.0, 7.0, 8.0, 8.0, 2.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-247.0, -241.271484375, -235.54296875, -229.814453125, -224.0859375, -218.357421875, -212.62890625, -206.900390625, -201.171875, -195.443359375, -189.71484375, -183.986328125, -178.2578125, -172.529296875, -166.80078125, -161.072265625, -155.34375, -149.615234375, -143.88671875, -138.158203125, -132.4296875, -126.701171875, -120.97265625, -115.244140625, -109.515625, -103.787109375, -98.05859375, -92.330078125, -86.6015625, -80.873046875, -75.14453125, -69.416015625, -63.6875, -57.958984375, -52.23046875, -46.501953125, -40.7734375, -35.044921875, -29.31640625, -23.587890625, -17.859375, -12.130859375, -6.40234375, -0.673828125, 5.0546875, 10.783203125, 16.51171875, 22.240234375, 27.96875, 33.697265625, 39.42578125, 45.154296875, 50.8828125, 56.611328125, 62.33984375, 68.068359375, 73.796875, 79.525390625, 85.25390625, 90.982421875, 96.7109375, 102.439453125, 108.16796875, 113.896484375, 119.625]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 11.0, 34.0, 77.0, 201.0, 332.0, 207.0, 77.0, 41.0, 14.0, 10.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-353.7979431152344, -343.8592224121094, -333.9205322265625, -323.9818115234375, -314.0431213378906, -304.1044006347656, -294.16571044921875, -284.22698974609375, -274.2882995605469, -264.3495788574219, -254.410888671875, -244.47218322753906, -234.53347778320312, -224.5947723388672, -214.65606689453125, -204.71734619140625, -194.7786407470703, -184.83993530273438, -174.90122985839844, -164.9625244140625, -155.02381896972656, -145.08511352539062, -135.14639282226562, -125.20769500732422, -115.26898956298828, -105.33028411865234, -95.3915786743164, -85.45286560058594, -75.51416015625, -65.57545471191406, -55.636749267578125, -45.69804382324219, -35.75933837890625, -25.820632934570312, -15.881925582885742, -5.943218231201172, 3.9954872131347656, 13.934192657470703, 23.872901916503906, 33.811607360839844, 43.75031280517578, 53.68901824951172, 63.627723693847656, 73.56643676757812, 83.50514221191406, 93.44384765625, 103.38255310058594, 113.32125854492188, 123.25996398925781, 133.19866943359375, 143.1373748779297, 153.07608032226562, 163.01478576660156, 172.9534912109375, 182.8922119140625, 192.83090209960938, 202.76962280273438, 212.7083282470703, 222.64703369140625, 232.5857391357422, 242.52444458007812, 252.46315002441406, 262.40185546875, 272.340576171875, 282.2792663574219]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 7.0, 9.0, 5.0, 9.0, 6.0, 7.0, 8.0, 7.0, 23.0, 25.0, 25.0, 24.0, 29.0, 26.0, 35.0, 32.0, 33.0, 36.0, 27.0, 30.0, 48.0, 42.0, 49.0, 38.0, 41.0, 39.0, 36.0, 35.0, 34.0, 32.0, 20.0, 23.0, 25.0, 17.0, 21.0, 17.0, 17.0, 9.0, 16.0, 4.0, 1.0, 6.0, 7.0, 8.0, 4.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-102.43939208984375, -99.35327911376953, -96.26717376708984, -93.18106079101562, -90.09495544433594, -87.00884246826172, -83.9227294921875, -80.83662414550781, -77.75051879882812, -74.6644058227539, -71.57830047607422, -68.4921875, -65.40608215332031, -62.319969177246094, -59.23386001586914, -56.14775085449219, -53.06163787841797, -49.975528717041016, -46.88941955566406, -43.803306579589844, -40.717201232910156, -37.63108825683594, -34.544979095458984, -31.45886993408203, -28.372760772705078, -25.286651611328125, -22.200542449951172, -19.114431381225586, -16.028322219848633, -12.94221305847168, -9.856101989746094, -6.769992828369141, -3.6838836669921875, -0.5977740287780762, 2.488335609436035, 5.574445724487305, 8.660554885864258, 11.746664047241211, 14.832775115966797, 17.91888427734375, 21.004993438720703, 24.091102600097656, 27.17721176147461, 30.263322830200195, 33.34943389892578, 36.43553924560547, 39.52165222167969, 42.60776138305664, 45.693870544433594, 48.77997970581055, 51.8660888671875, 54.95220184326172, 58.038307189941406, 61.124420166015625, 64.21052551269531, 67.29663848876953, 70.38275146484375, 73.46886444091797, 76.55496978759766, 79.64108276367188, 82.72718811035156, 85.81330108642578, 88.8994140625, 91.98551940917969, 95.07162475585938]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 3.0, 6.0, 11.0, 11.0, 7.0, 13.0, 19.0, 20.0, 19.0, 23.0, 44.0, 39.0, 46.0, 52.0, 64.0, 37.0, 59.0, 49.0, 50.0, 48.0, 47.0, 35.0, 39.0, 44.0, 30.0, 35.0, 32.0, 16.0, 16.0, 15.0, 24.0, 8.0, 12.0, 10.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-25.953125, -25.22607421875, -24.4990234375, -23.77197265625, -23.044921875, -22.31787109375, -21.5908203125, -20.86376953125, -20.13671875, -19.40966796875, -18.6826171875, -17.95556640625, -17.228515625, -16.50146484375, -15.7744140625, -15.04736328125, -14.3203125, -13.59326171875, -12.8662109375, -12.13916015625, -11.412109375, -10.68505859375, -9.9580078125, -9.23095703125, -8.50390625, -7.77685546875, -7.0498046875, -6.32275390625, -5.595703125, -4.86865234375, -4.1416015625, -3.41455078125, -2.6875, -1.96044921875, -1.2333984375, -0.50634765625, 0.220703125, 0.94775390625, 1.6748046875, 2.40185546875, 3.12890625, 3.85595703125, 4.5830078125, 5.31005859375, 6.037109375, 6.76416015625, 7.4912109375, 8.21826171875, 8.9453125, 9.67236328125, 10.3994140625, 11.12646484375, 11.853515625, 12.58056640625, 13.3076171875, 14.03466796875, 14.76171875, 15.48876953125, 16.2158203125, 16.94287109375, 17.669921875, 18.39697265625, 19.1240234375, 19.85107421875, 20.578125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 9.0, 9.0, 13.0, 16.0, 22.0, 39.0, 49.0, 85.0, 110.0, 155.0, 280.0, 403.0, 705.0, 1088.0, 1872.0, 3404.0, 6164.0, 12117.0, 24441.0, 53310.0, 124057.0, 324984.0, 289677.0, 110545.0, 47824.0, 22471.0, 11127.0, 5814.0, 3166.0, 1748.0, 1056.0, 646.0, 395.0, 263.0, 162.0, 106.0, 71.0, 45.0, 35.0, 21.0, 16.0, 19.0, 5.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.361328125, -2.27972412109375, -2.1981201171875, -2.11651611328125, -2.034912109375, -1.95330810546875, -1.8717041015625, -1.79010009765625, -1.70849609375, -1.62689208984375, -1.5452880859375, -1.46368408203125, -1.382080078125, -1.30047607421875, -1.2188720703125, -1.13726806640625, -1.0556640625, -0.97406005859375, -0.8924560546875, -0.81085205078125, -0.729248046875, -0.64764404296875, -0.5660400390625, -0.48443603515625, -0.40283203125, -0.32122802734375, -0.2396240234375, -0.15802001953125, -0.076416015625, 0.00518798828125, 0.0867919921875, 0.16839599609375, 0.25, 0.33160400390625, 0.4132080078125, 0.49481201171875, 0.576416015625, 0.65802001953125, 0.7396240234375, 0.82122802734375, 0.90283203125, 0.98443603515625, 1.0660400390625, 1.14764404296875, 1.229248046875, 1.31085205078125, 1.3924560546875, 1.47406005859375, 1.5556640625, 1.63726806640625, 1.7188720703125, 1.80047607421875, 1.882080078125, 1.96368408203125, 2.0452880859375, 2.12689208984375, 2.20849609375, 2.29010009765625, 2.3717041015625, 2.45330810546875, 2.534912109375, 2.61651611328125, 2.6981201171875, 2.77972412109375, 2.861328125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 2.0, 3.0, 3.0, 6.0, 2.0, 7.0, 8.0, 16.0, 10.0, 22.0, 27.0, 18.0, 22.0, 23.0, 35.0, 25.0, 32.0, 30.0, 39.0, 30.0, 35.0, 27.0, 28.0, 37.0, 1061.0, 32.0, 30.0, 28.0, 48.0, 35.0, 33.0, 29.0, 27.0, 15.0, 28.0, 26.0, 28.0, 17.0, 17.0, 19.0, 18.0, 12.0, 13.0, 4.0, 8.0, 3.0, 4.0, 4.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-11.7265625, -11.3643798828125, -11.002197265625, -10.6400146484375, -10.27783203125, -9.9156494140625, -9.553466796875, -9.1912841796875, -8.8291015625, -8.4669189453125, -8.104736328125, -7.7425537109375, -7.38037109375, -7.0181884765625, -6.656005859375, -6.2938232421875, -5.931640625, -5.5694580078125, -5.207275390625, -4.8450927734375, -4.48291015625, -4.1207275390625, -3.758544921875, -3.3963623046875, -3.0341796875, -2.6719970703125, -2.309814453125, -1.9476318359375, -1.58544921875, -1.2232666015625, -0.861083984375, -0.4989013671875, -0.13671875, 0.2254638671875, 0.587646484375, 0.9498291015625, 1.31201171875, 1.6741943359375, 2.036376953125, 2.3985595703125, 2.7607421875, 3.1229248046875, 3.485107421875, 3.8472900390625, 4.20947265625, 4.5716552734375, 4.933837890625, 5.2960205078125, 5.658203125, 6.0203857421875, 6.382568359375, 6.7447509765625, 7.10693359375, 7.4691162109375, 7.831298828125, 8.1934814453125, 8.5556640625, 8.9178466796875, 9.280029296875, 9.6422119140625, 10.00439453125, 10.3665771484375, 10.728759765625, 11.0909423828125, 11.453125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 6.0, 5.0, 21.0, 23.0, 36.0, 29.0, 58.0, 99.0, 151.0, 192.0, 269.0, 489.0, 715.0, 1190.0, 1815.0, 2849.0, 4483.0, 7320.0, 11395.0, 18901.0, 31480.0, 53932.0, 99414.0, 203671.0, 1329795.0, 145933.0, 75222.0, 42381.0, 24685.0, 15197.0, 9359.0, 5909.0, 3600.0, 2354.0, 1437.0, 929.0, 618.0, 393.0, 224.0, 185.0, 122.0, 64.0, 54.0, 36.0, 24.0, 23.0, 15.0, 10.0, 7.0, 4.0, 7.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8203125, -1.762115478515625, -1.70391845703125, -1.645721435546875, -1.5875244140625, -1.529327392578125, -1.47113037109375, -1.412933349609375, -1.354736328125, -1.296539306640625, -1.23834228515625, -1.180145263671875, -1.1219482421875, -1.063751220703125, -1.00555419921875, -0.947357177734375, -0.88916015625, -0.830963134765625, -0.77276611328125, -0.714569091796875, -0.6563720703125, -0.598175048828125, -0.53997802734375, -0.481781005859375, -0.423583984375, -0.365386962890625, -0.30718994140625, -0.248992919921875, -0.1907958984375, -0.132598876953125, -0.07440185546875, -0.016204833984375, 0.0419921875, 0.100189208984375, 0.15838623046875, 0.216583251953125, 0.2747802734375, 0.332977294921875, 0.39117431640625, 0.449371337890625, 0.507568359375, 0.565765380859375, 0.62396240234375, 0.682159423828125, 0.7403564453125, 0.798553466796875, 0.85675048828125, 0.914947509765625, 0.97314453125, 1.031341552734375, 1.08953857421875, 1.147735595703125, 1.2059326171875, 1.264129638671875, 1.32232666015625, 1.380523681640625, 1.438720703125, 1.496917724609375, 1.55511474609375, 1.613311767578125, 1.6715087890625, 1.729705810546875, 1.78790283203125, 1.846099853515625, 1.904296875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 5.0, 4.0, 2.0, 4.0, 6.0, 8.0, 11.0, 16.0, 23.0, 28.0, 22.0, 30.0, 42.0, 45.0, 47.0, 50.0, 74.0, 60.0, 71.0, 57.0, 55.0, 60.0, 51.0, 41.0, 38.0, 26.0, 36.0, 25.0, 7.0, 16.0, 4.0, 4.0, 10.0, 11.0, 0.0, 2.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00435638427734375, -0.004197597503662109, -0.004038810729980469, -0.003880023956298828, -0.0037212371826171875, -0.003562450408935547, -0.0034036636352539062, -0.0032448768615722656, -0.003086090087890625, -0.0029273033142089844, -0.0027685165405273438, -0.002609729766845703, -0.0024509429931640625, -0.002292156219482422, -0.0021333694458007812, -0.0019745826721191406, -0.0018157958984375, -0.0016570091247558594, -0.0014982223510742188, -0.0013394355773925781, -0.0011806488037109375, -0.0010218620300292969, -0.0008630752563476562, -0.0007042884826660156, -0.000545501708984375, -0.0003867149353027344, -0.00022792816162109375, -6.914138793945312e-05, 8.96453857421875e-05, 0.0002484321594238281, 0.00040721893310546875, 0.0005660057067871094, 0.00072479248046875, 0.0008835792541503906, 0.0010423660278320312, 0.0012011528015136719, 0.0013599395751953125, 0.0015187263488769531, 0.0016775131225585938, 0.0018362998962402344, 0.001995086669921875, 0.0021538734436035156, 0.0023126602172851562, 0.002471446990966797, 0.0026302337646484375, 0.002789020538330078, 0.0029478073120117188, 0.0031065940856933594, 0.003265380859375, 0.0034241676330566406, 0.0035829544067382812, 0.003741741180419922, 0.0039005279541015625, 0.004059314727783203, 0.004218101501464844, 0.004376888275146484, 0.004535675048828125, 0.004694461822509766, 0.004853248596191406, 0.005012035369873047, 0.0051708221435546875, 0.005329608917236328, 0.005488395690917969, 0.005647182464599609, 0.00580596923828125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 12.0, 10.0, 12.0, 12.0, 23.0, 29.0, 40.0, 50.0, 71.0, 85.0, 119.0, 209.0, 451.0, 1999.0, 971367.0, 72199.0, 931.0, 264.0, 191.0, 119.0, 79.0, 66.0, 46.0, 40.0, 32.0, 21.0, 18.0, 8.0, 10.0, 9.0, 2.0, 4.0, 1.0, 9.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12060546875, -0.11723613739013672, -0.11386680603027344, -0.11049747467041016, -0.10712814331054688, -0.1037588119506836, -0.10038948059082031, -0.09702014923095703, -0.09365081787109375, -0.09028148651123047, -0.08691215515136719, -0.0835428237915039, -0.08017349243164062, -0.07680416107177734, -0.07343482971191406, -0.07006549835205078, -0.0666961669921875, -0.06332683563232422, -0.05995750427246094, -0.056588172912597656, -0.053218841552734375, -0.049849510192871094, -0.04648017883300781, -0.04311084747314453, -0.03974151611328125, -0.03637218475341797, -0.03300285339355469, -0.029633522033691406, -0.026264190673828125, -0.022894859313964844, -0.019525527954101562, -0.01615619659423828, -0.012786865234375, -0.009417533874511719, -0.0060482025146484375, -0.0026788711547851562, 0.000690460205078125, 0.004059791564941406, 0.0074291229248046875, 0.010798454284667969, 0.01416778564453125, 0.01753711700439453, 0.020906448364257812, 0.024275779724121094, 0.027645111083984375, 0.031014442443847656, 0.03438377380371094, 0.03775310516357422, 0.0411224365234375, 0.04449176788330078, 0.04786109924316406, 0.051230430603027344, 0.054599761962890625, 0.057969093322753906, 0.06133842468261719, 0.06470775604248047, 0.06807708740234375, 0.07144641876220703, 0.07481575012207031, 0.0781850814819336, 0.08155441284179688, 0.08492374420166016, 0.08829307556152344, 0.09166240692138672, 0.09503173828125]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 27.0, 633.0, 342.0, 13.0, 3.0, 0.0, 1.0], "bins": [-0.04584449157118797, -0.04506592079997063, -0.04428735002875328, -0.043508779257535934, -0.04273020848631859, -0.04195163771510124, -0.041173066943883896, -0.04039449617266655, -0.039615925401449203, -0.03883735463023186, -0.03805878385901451, -0.037280213087797165, -0.03650164231657982, -0.03572307154536247, -0.034944500774145126, -0.03416593000292778, -0.033387359231710434, -0.03260878846049309, -0.03183021768927574, -0.031051646918058395, -0.03027307614684105, -0.029494505375623703, -0.028715934604406357, -0.02793736383318901, -0.027158793061971664, -0.026380222290754318, -0.025601651519536972, -0.024823080748319626, -0.02404450997710228, -0.023265939205884933, -0.022487368434667587, -0.02170879766345024, -0.020930228754878044, -0.020151657983660698, -0.019373087212443352, -0.018594516441226006, -0.01781594567000866, -0.017037374898791313, -0.016258804127573967, -0.01548023335635662, -0.014701662585139275, -0.013923091813921928, -0.013144521042704582, -0.012365950271487236, -0.01158737950026989, -0.010808808729052544, -0.010030237957835197, -0.009251667186617851, -0.008473096415400505, -0.007694525644183159, -0.006915954872965813, -0.0061373841017484665, -0.00535881333053112, -0.004580242559313774, -0.003801671788096428, -0.0030231010168790817, -0.0022445302456617355, -0.0014659594744443893, -0.0006873887032270432, 9.118206799030304e-05, 0.0008697528392076492, 0.0016483236104249954, 0.0024268943816423416, 0.003205465152859688, 0.003984035924077034]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 3.0, 7.0, 9.0, 7.0, 8.0, 10.0, 22.0, 17.0, 24.0, 17.0, 27.0, 30.0, 30.0, 47.0, 39.0, 48.0, 33.0, 43.0, 33.0, 41.0, 34.0, 47.0, 47.0, 47.0, 41.0, 37.0, 37.0, 32.0, 20.0, 29.0, 17.0, 18.0, 20.0, 15.0, 10.0, 9.0, 5.0, 6.0, 11.0, 8.0, 8.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0027136802673339844, -0.0026338156312704086, -0.002553950995206833, -0.002474086359143257, -0.0023942217230796814, -0.0023143570870161057, -0.00223449245095253, -0.002154627814888954, -0.0020747631788253784, -0.0019948985427618027, -0.001915033906698227, -0.0018351692706346512, -0.0017553046345710754, -0.0016754399985074997, -0.001595575362443924, -0.0015157107263803482, -0.0014358460903167725, -0.0013559814542531967, -0.001276116818189621, -0.0011962521821260452, -0.0011163875460624695, -0.0010365229099988937, -0.000956658273935318, -0.0008767936378717422, -0.0007969290018081665, -0.0007170643657445908, -0.000637199729681015, -0.0005573350936174393, -0.0004774704575538635, -0.0003976058214902878, -0.00031774118542671204, -0.0002378765493631363, -0.00015801191329956055, -7.81472772359848e-05, 1.7173588275909424e-06, 8.158199489116669e-05, 0.00016144663095474243, 0.00024131126701831818, 0.0003211759030818939, 0.00040104053914546967, 0.0004809051752090454, 0.0005607698112726212, 0.0006406344473361969, 0.0007204990833997726, 0.0008003637194633484, 0.0008802283555269241, 0.0009600929915904999, 0.0010399576276540756, 0.0011198222637176514, 0.0011996868997812271, 0.0012795515358448029, 0.0013594161719083786, 0.0014392808079719543, 0.00151914544403553, 0.0015990100800991058, 0.0016788747161626816, 0.0017587393522262573, 0.001838603988289833, 0.0019184686243534088, 0.0019983332604169846, 0.0020781978964805603, 0.002158062532544136, 0.002237927168607712, 0.0023177918046712875, 0.0023976564407348633]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 5.0, 4.0, 3.0, 6.0, 11.0, 11.0, 7.0, 13.0, 19.0, 20.0, 19.0, 23.0, 44.0, 40.0, 45.0, 52.0, 64.0, 37.0, 59.0, 49.0, 50.0, 48.0, 47.0, 35.0, 39.0, 44.0, 30.0, 35.0, 32.0, 16.0, 16.0, 15.0, 24.0, 8.0, 12.0, 10.0, 5.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-25.953125, -25.22607421875, -24.4990234375, -23.77197265625, -23.044921875, -22.31787109375, -21.5908203125, -20.86376953125, -20.13671875, -19.40966796875, -18.6826171875, -17.95556640625, -17.228515625, -16.50146484375, -15.7744140625, -15.04736328125, -14.3203125, -13.59326171875, -12.8662109375, -12.13916015625, -11.412109375, -10.68505859375, -9.9580078125, -9.23095703125, -8.50390625, -7.77685546875, -7.0498046875, -6.32275390625, -5.595703125, -4.86865234375, -4.1416015625, -3.41455078125, -2.6875, -1.96044921875, -1.2333984375, -0.50634765625, 0.220703125, 0.94775390625, 1.6748046875, 2.40185546875, 3.12890625, 3.85595703125, 4.5830078125, 5.31005859375, 6.037109375, 6.76416015625, 7.4912109375, 8.21826171875, 8.9453125, 9.67236328125, 10.3994140625, 11.12646484375, 11.853515625, 12.58056640625, 13.3076171875, 14.03466796875, 14.76171875, 15.48876953125, 16.2158203125, 16.94287109375, 17.669921875, 18.39697265625, 19.1240234375, 19.85107421875, 20.578125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 8.0, 9.0, 8.0, 19.0, 25.0, 23.0, 52.0, 74.0, 95.0, 150.0, 283.0, 507.0, 822.0, 1455.0, 2772.0, 5586.0, 13533.0, 40065.0, 183149.0, 614391.0, 131672.0, 32133.0, 11371.0, 4782.0, 2439.0, 1268.0, 681.0, 451.0, 261.0, 161.0, 99.0, 66.0, 54.0, 22.0, 32.0, 16.0, 9.0, 9.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.734375, -22.09228515625, -21.4501953125, -20.80810546875, -20.166015625, -19.52392578125, -18.8818359375, -18.23974609375, -17.59765625, -16.95556640625, -16.3134765625, -15.67138671875, -15.029296875, -14.38720703125, -13.7451171875, -13.10302734375, -12.4609375, -11.81884765625, -11.1767578125, -10.53466796875, -9.892578125, -9.25048828125, -8.6083984375, -7.96630859375, -7.32421875, -6.68212890625, -6.0400390625, -5.39794921875, -4.755859375, -4.11376953125, -3.4716796875, -2.82958984375, -2.1875, -1.54541015625, -0.9033203125, -0.26123046875, 0.380859375, 1.02294921875, 1.6650390625, 2.30712890625, 2.94921875, 3.59130859375, 4.2333984375, 4.87548828125, 5.517578125, 6.15966796875, 6.8017578125, 7.44384765625, 8.0859375, 8.72802734375, 9.3701171875, 10.01220703125, 10.654296875, 11.29638671875, 11.9384765625, 12.58056640625, 13.22265625, 13.86474609375, 14.5068359375, 15.14892578125, 15.791015625, 16.43310546875, 17.0751953125, 17.71728515625, 18.359375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 8.0, 8.0, 5.0, 5.0, 12.0, 14.0, 15.0, 21.0, 18.0, 20.0, 25.0, 24.0, 34.0, 46.0, 36.0, 34.0, 39.0, 61.0, 98.0, 1770.0, 268.0, 79.0, 48.0, 41.0, 35.0, 42.0, 36.0, 34.0, 23.0, 26.0, 21.0, 23.0, 14.0, 12.0, 11.0, 6.0, 7.0, 13.0, 3.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-72.875, -70.83740234375, -68.7998046875, -66.76220703125, -64.724609375, -62.68701171875, -60.6494140625, -58.61181640625, -56.57421875, -54.53662109375, -52.4990234375, -50.46142578125, -48.423828125, -46.38623046875, -44.3486328125, -42.31103515625, -40.2734375, -38.23583984375, -36.1982421875, -34.16064453125, -32.123046875, -30.08544921875, -28.0478515625, -26.01025390625, -23.97265625, -21.93505859375, -19.8974609375, -17.85986328125, -15.822265625, -13.78466796875, -11.7470703125, -9.70947265625, -7.671875, -5.63427734375, -3.5966796875, -1.55908203125, 0.478515625, 2.51611328125, 4.5537109375, 6.59130859375, 8.62890625, 10.66650390625, 12.7041015625, 14.74169921875, 16.779296875, 18.81689453125, 20.8544921875, 22.89208984375, 24.9296875, 26.96728515625, 29.0048828125, 31.04248046875, 33.080078125, 35.11767578125, 37.1552734375, 39.19287109375, 41.23046875, 43.26806640625, 45.3056640625, 47.34326171875, 49.380859375, 51.41845703125, 53.4560546875, 55.49365234375, 57.53125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 6.0, 10.0, 9.0, 10.0, 11.0, 25.0, 12.0, 18.0, 46.0, 51.0, 64.0, 83.0, 97.0, 143.0, 217.0, 378.0, 1133.0, 9705.0, 2879435.0, 247896.0, 4534.0, 770.0, 292.0, 175.0, 156.0, 87.0, 74.0, 63.0, 44.0, 33.0, 34.0, 17.0, 20.0, 10.0, 8.0, 14.0, 7.0, 5.0, 6.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-111.5, -107.8876953125, -104.275390625, -100.6630859375, -97.05078125, -93.4384765625, -89.826171875, -86.2138671875, -82.6015625, -78.9892578125, -75.376953125, -71.7646484375, -68.15234375, -64.5400390625, -60.927734375, -57.3154296875, -53.703125, -50.0908203125, -46.478515625, -42.8662109375, -39.25390625, -35.6416015625, -32.029296875, -28.4169921875, -24.8046875, -21.1923828125, -17.580078125, -13.9677734375, -10.35546875, -6.7431640625, -3.130859375, 0.4814453125, 4.09375, 7.7060546875, 11.318359375, 14.9306640625, 18.54296875, 22.1552734375, 25.767578125, 29.3798828125, 32.9921875, 36.6044921875, 40.216796875, 43.8291015625, 47.44140625, 51.0537109375, 54.666015625, 58.2783203125, 61.890625, 65.5029296875, 69.115234375, 72.7275390625, 76.33984375, 79.9521484375, 83.564453125, 87.1767578125, 90.7890625, 94.4013671875, 98.013671875, 101.6259765625, 105.23828125, 108.8505859375, 112.462890625, 116.0751953125, 119.6875]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 13.0, 156.0, 649.0, 180.0, 20.0], "bins": [-574.3106689453125, -564.9722900390625, -555.6339111328125, -546.2955322265625, -536.9571533203125, -527.6188354492188, -518.2804565429688, -508.94207763671875, -499.60369873046875, -490.26531982421875, -480.92694091796875, -471.5885925292969, -462.2502136230469, -452.9118347167969, -443.5734558105469, -434.235107421875, -424.896728515625, -415.558349609375, -406.219970703125, -396.8816223144531, -387.5432434082031, -378.2048645019531, -368.8664855957031, -359.52813720703125, -350.1897277832031, -340.8513488769531, -331.5129699707031, -322.17462158203125, -312.83624267578125, -303.49786376953125, -294.15948486328125, -284.82110595703125, -275.4827575683594, -266.1443786621094, -256.8059997558594, -247.46763610839844, -238.1292724609375, -228.7908935546875, -219.4525146484375, -210.11415100097656, -200.77578735351562, -191.43740844726562, -182.0990447998047, -172.7606658935547, -163.42230224609375, -154.08392333984375, -144.74554443359375, -135.4071807861328, -126.06880187988281, -116.73043060302734, -107.39205932617188, -98.05368041992188, -88.71531677246094, -79.37693786621094, -70.03856658935547, -60.7001953125, -51.36182403564453, -42.02345275878906, -32.685081481933594, -23.34670639038086, -14.00833511352539, -4.669963836669922, 4.6684112548828125, 14.006782531738281, 23.34515380859375]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 6.0, 3.0, 8.0, 6.0, 3.0, 8.0, 13.0, 25.0, 20.0, 15.0, 15.0, 20.0, 20.0, 29.0, 25.0, 39.0, 42.0, 47.0, 46.0, 52.0, 46.0, 50.0, 42.0, 41.0, 49.0, 44.0, 33.0, 33.0, 25.0, 32.0, 28.0, 20.0, 16.0, 20.0, 16.0, 10.0, 12.0, 9.0, 9.0, 4.0, 7.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.85232543945312, -142.83575439453125, -137.81919860839844, -132.80262756347656, -127.78605651855469, -122.76949310302734, -117.7529296875, -112.73635864257812, -107.71979522705078, -102.70323181152344, -97.68666076660156, -92.67009735107422, -87.65353393554688, -82.636962890625, -77.62039947509766, -72.60383605957031, -67.58726501464844, -62.57069778442383, -57.55413055419922, -52.537567138671875, -47.520999908447266, -42.504432678222656, -37.48786926269531, -32.4713020324707, -27.454734802246094, -22.438167572021484, -17.421602249145508, -12.405035972595215, -7.388469696044922, -2.3719024658203125, 2.644662857055664, 7.661228179931641, 12.677780151367188, 17.694347381591797, 22.710912704467773, 27.72747802734375, 32.74404525756836, 37.76061248779297, 42.77717590332031, 47.79374313354492, 52.81031036376953, 57.82687759399414, 62.84344482421875, 67.8600082397461, 72.87657165527344, 77.89314270019531, 82.90970611572266, 87.92626953125, 92.94284057617188, 97.95940399169922, 102.9759750366211, 107.99253845214844, 113.00910949707031, 118.02567291259766, 123.042236328125, 128.05880737304688, 133.07537841796875, 138.09194946289062, 143.10850524902344, 148.1250762939453, 153.1416473388672, 158.158203125, 163.17477416992188, 168.19134521484375, 173.20790100097656]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 6.0, 11.0, 7.0, 15.0, 12.0, 13.0, 15.0, 20.0, 29.0, 20.0, 32.0, 46.0, 43.0, 44.0, 51.0, 44.0, 44.0, 64.0, 56.0, 40.0, 49.0, 43.0, 32.0, 34.0, 31.0, 29.0, 31.0, 27.0, 18.0, 17.0, 17.0, 22.0, 10.0, 8.0, 3.0, 11.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.21875, -24.494384765625, -23.77001953125, -23.045654296875, -22.3212890625, -21.596923828125, -20.87255859375, -20.148193359375, -19.423828125, -18.699462890625, -17.97509765625, -17.250732421875, -16.5263671875, -15.802001953125, -15.07763671875, -14.353271484375, -13.62890625, -12.904541015625, -12.18017578125, -11.455810546875, -10.7314453125, -10.007080078125, -9.28271484375, -8.558349609375, -7.833984375, -7.109619140625, -6.38525390625, -5.660888671875, -4.9365234375, -4.212158203125, -3.48779296875, -2.763427734375, -2.0390625, -1.314697265625, -0.59033203125, 0.134033203125, 0.8583984375, 1.582763671875, 2.30712890625, 3.031494140625, 3.755859375, 4.480224609375, 5.20458984375, 5.928955078125, 6.6533203125, 7.377685546875, 8.10205078125, 8.826416015625, 9.55078125, 10.275146484375, 10.99951171875, 11.723876953125, 12.4482421875, 13.172607421875, 13.89697265625, 14.621337890625, 15.345703125, 16.070068359375, 16.79443359375, 17.518798828125, 18.2431640625, 18.967529296875, 19.69189453125, 20.416259765625, 21.140625]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 6.0, 10.0, 12.0, 20.0, 13.0, 17.0, 29.0, 55.0, 51.0, 94.0, 189.0, 278.0, 578.0, 1151.0, 2711.0, 7447.0, 41354.0, 2869239.0, 1235455.0, 25145.0, 5836.0, 2364.0, 1008.0, 514.0, 264.0, 150.0, 88.0, 62.0, 28.0, 27.0, 24.0, 19.0, 16.0, 9.0, 4.0, 3.0, 4.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-79.9375, -77.646484375, -75.35546875, -73.064453125, -70.7734375, -68.482421875, -66.19140625, -63.900390625, -61.609375, -59.318359375, -57.02734375, -54.736328125, -52.4453125, -50.154296875, -47.86328125, -45.572265625, -43.28125, -40.990234375, -38.69921875, -36.408203125, -34.1171875, -31.826171875, -29.53515625, -27.244140625, -24.953125, -22.662109375, -20.37109375, -18.080078125, -15.7890625, -13.498046875, -11.20703125, -8.916015625, -6.625, -4.333984375, -2.04296875, 0.248046875, 2.5390625, 4.830078125, 7.12109375, 9.412109375, 11.703125, 13.994140625, 16.28515625, 18.576171875, 20.8671875, 23.158203125, 25.44921875, 27.740234375, 30.03125, 32.322265625, 34.61328125, 36.904296875, 39.1953125, 41.486328125, 43.77734375, 46.068359375, 48.359375, 50.650390625, 52.94140625, 55.232421875, 57.5234375, 59.814453125, 62.10546875, 64.396484375, 66.6875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 4.0, 4.0, 7.0, 3.0, 6.0, 12.0, 8.0, 10.0, 24.0, 28.0, 32.0, 42.0, 75.0, 147.0, 228.0, 394.0, 725.0, 883.0, 583.0, 352.0, 191.0, 112.0, 49.0, 43.0, 20.0, 17.0, 13.0, 11.0, 7.0, 9.0, 8.0, 7.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.375, -38.11767578125, -36.8603515625, -35.60302734375, -34.345703125, -33.08837890625, -31.8310546875, -30.57373046875, -29.31640625, -28.05908203125, -26.8017578125, -25.54443359375, -24.287109375, -23.02978515625, -21.7724609375, -20.51513671875, -19.2578125, -18.00048828125, -16.7431640625, -15.48583984375, -14.228515625, -12.97119140625, -11.7138671875, -10.45654296875, -9.19921875, -7.94189453125, -6.6845703125, -5.42724609375, -4.169921875, -2.91259765625, -1.6552734375, -0.39794921875, 0.859375, 2.11669921875, 3.3740234375, 4.63134765625, 5.888671875, 7.14599609375, 8.4033203125, 9.66064453125, 10.91796875, 12.17529296875, 13.4326171875, 14.68994140625, 15.947265625, 17.20458984375, 18.4619140625, 19.71923828125, 20.9765625, 22.23388671875, 23.4912109375, 24.74853515625, 26.005859375, 27.26318359375, 28.5205078125, 29.77783203125, 31.03515625, 32.29248046875, 33.5498046875, 34.80712890625, 36.064453125, 37.32177734375, 38.5791015625, 39.83642578125, 41.09375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 3.0, 4.0, 8.0, 10.0, 14.0, 21.0, 19.0, 29.0, 50.0, 55.0, 90.0, 228.0, 466.0, 1245.0, 3729.0, 14651.0, 117863.0, 3922000.0, 113447.0, 14431.0, 3627.0, 1220.0, 485.0, 202.0, 144.0, 69.0, 46.0, 29.0, 22.0, 24.0, 8.0, 14.0, 9.0, 4.0, 5.0, 3.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-116.9375, -113.224609375, -109.51171875, -105.798828125, -102.0859375, -98.373046875, -94.66015625, -90.947265625, -87.234375, -83.521484375, -79.80859375, -76.095703125, -72.3828125, -68.669921875, -64.95703125, -61.244140625, -57.53125, -53.818359375, -50.10546875, -46.392578125, -42.6796875, -38.966796875, -35.25390625, -31.541015625, -27.828125, -24.115234375, -20.40234375, -16.689453125, -12.9765625, -9.263671875, -5.55078125, -1.837890625, 1.875, 5.587890625, 9.30078125, 13.013671875, 16.7265625, 20.439453125, 24.15234375, 27.865234375, 31.578125, 35.291015625, 39.00390625, 42.716796875, 46.4296875, 50.142578125, 53.85546875, 57.568359375, 61.28125, 64.994140625, 68.70703125, 72.419921875, 76.1328125, 79.845703125, 83.55859375, 87.271484375, 90.984375, 94.697265625, 98.41015625, 102.123046875, 105.8359375, 109.548828125, 113.26171875, 116.974609375, 120.6875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 14.0, 16.0, 27.0, 49.0, 68.0, 142.0, 167.0, 186.0, 115.0, 87.0, 62.0, 34.0, 15.0, 11.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-208.77386474609375, -203.14276123046875, -197.51165771484375, -191.88055419921875, -186.24945068359375, -180.61834716796875, -174.98724365234375, -169.35614013671875, -163.72503662109375, -158.09393310546875, -152.46282958984375, -146.83172607421875, -141.20062255859375, -135.56951904296875, -129.93841552734375, -124.30730438232422, -118.67619323730469, -113.04508972167969, -107.41398620605469, -101.78288269042969, -96.15177917480469, -90.52067565917969, -84.88956451416016, -79.25846099853516, -73.62735748291016, -67.99625396728516, -62.365150451660156, -56.73404312133789, -51.10293960571289, -45.47183609008789, -39.840728759765625, -34.209625244140625, -28.578536987304688, -22.947433471679688, -17.316328048706055, -11.685222625732422, -6.054119110107422, -0.4230155944824219, 5.208091735839844, 10.839195251464844, 16.470298767089844, 22.101402282714844, 27.732507705688477, 33.36361312866211, 38.99471664428711, 44.62582015991211, 50.256927490234375, 55.888031005859375, 61.519134521484375, 67.15023803710938, 72.78134155273438, 78.41244506835938, 84.04354858398438, 89.67465209960938, 95.3057632446289, 100.9368667602539, 106.5679702758789, 112.1990737915039, 117.8301773071289, 123.46128845214844, 129.09239196777344, 134.72349548339844, 140.35459899902344, 145.98570251464844, 151.61680603027344]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 7.0, 6.0, 7.0, 6.0, 10.0, 13.0, 11.0, 22.0, 12.0, 21.0, 22.0, 26.0, 25.0, 23.0, 33.0, 35.0, 29.0, 32.0, 48.0, 48.0, 38.0, 43.0, 48.0, 28.0, 37.0, 34.0, 36.0, 29.0, 44.0, 29.0, 29.0, 33.0, 16.0, 30.0, 8.0, 15.0, 12.0, 6.0, 8.0, 9.0, 8.0, 5.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-97.0870361328125, -93.92354583740234, -90.76005554199219, -87.59656524658203, -84.43307495117188, -81.26957702636719, -78.10608673095703, -74.94259643554688, -71.77910614013672, -68.61561584472656, -65.4521255493164, -62.288631439208984, -59.12514114379883, -55.96165084838867, -52.79815673828125, -49.634666442871094, -46.47117614746094, -43.30768585205078, -40.144195556640625, -36.9807014465332, -33.81721115112305, -30.65372085571289, -27.4902286529541, -24.326736450195312, -21.163246154785156, -17.999755859375, -14.836263656616211, -11.672772407531738, -8.509281158447266, -5.345789909362793, -2.1822986602783203, 0.9811935424804688, 4.144683837890625, 7.308175086975098, 10.47166633605957, 13.635157585144043, 16.798648834228516, 19.962139129638672, 23.12563133239746, 26.28912353515625, 29.452613830566406, 32.61610412597656, 35.77959442138672, 38.94308853149414, 42.1065788269043, 45.27006912231445, 48.433563232421875, 51.59705352783203, 54.76054382324219, 57.924034118652344, 61.0875244140625, 64.25101470947266, 67.41450500488281, 70.5780029296875, 73.74149322509766, 76.90498352050781, 80.06847381591797, 83.23196411132812, 86.39545440673828, 89.55894470214844, 92.72244262695312, 95.88593292236328, 99.04942321777344, 102.2129135131836, 105.37640380859375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 7.0, 5.0, 8.0, 7.0, 10.0, 16.0, 23.0, 13.0, 16.0, 28.0, 23.0, 40.0, 37.0, 45.0, 43.0, 34.0, 44.0, 40.0, 52.0, 49.0, 46.0, 28.0, 32.0, 40.0, 51.0, 32.0, 32.0, 25.0, 30.0, 19.0, 29.0, 13.0, 11.0, 10.0, 18.0, 17.0, 8.0, 10.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.046875, -22.3515625, -21.65625, -20.9609375, -20.265625, -19.5703125, -18.875, -18.1796875, -17.484375, -16.7890625, -16.09375, -15.3984375, -14.703125, -14.0078125, -13.3125, -12.6171875, -11.921875, -11.2265625, -10.53125, -9.8359375, -9.140625, -8.4453125, -7.75, -7.0546875, -6.359375, -5.6640625, -4.96875, -4.2734375, -3.578125, -2.8828125, -2.1875, -1.4921875, -0.796875, -0.1015625, 0.59375, 1.2890625, 1.984375, 2.6796875, 3.375, 4.0703125, 4.765625, 5.4609375, 6.15625, 6.8515625, 7.546875, 8.2421875, 8.9375, 9.6328125, 10.328125, 11.0234375, 11.71875, 12.4140625, 13.109375, 13.8046875, 14.5, 15.1953125, 15.890625, 16.5859375, 17.28125, 17.9765625, 18.671875, 19.3671875, 20.0625, 20.7578125, 21.453125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 9.0, 9.0, 26.0, 27.0, 43.0, 68.0, 112.0, 146.0, 257.0, 369.0, 581.0, 921.0, 1455.0, 2288.0, 3658.0, 5969.0, 9502.0, 15624.0, 25489.0, 43836.0, 80223.0, 163193.0, 290171.0, 189440.0, 92019.0, 49231.0, 28379.0, 17357.0, 10666.0, 6501.0, 4015.0, 2584.0, 1598.0, 984.0, 678.0, 392.0, 244.0, 185.0, 99.0, 63.0, 49.0, 33.0, 27.0, 8.0, 7.0, 9.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.01953125, -1.95562744140625, -1.8917236328125, -1.82781982421875, -1.763916015625, -1.70001220703125, -1.6361083984375, -1.57220458984375, -1.50830078125, -1.44439697265625, -1.3804931640625, -1.31658935546875, -1.252685546875, -1.18878173828125, -1.1248779296875, -1.06097412109375, -0.9970703125, -0.93316650390625, -0.8692626953125, -0.80535888671875, -0.741455078125, -0.67755126953125, -0.6136474609375, -0.54974365234375, -0.48583984375, -0.42193603515625, -0.3580322265625, -0.29412841796875, -0.230224609375, -0.16632080078125, -0.1024169921875, -0.03851318359375, 0.025390625, 0.08929443359375, 0.1531982421875, 0.21710205078125, 0.281005859375, 0.34490966796875, 0.4088134765625, 0.47271728515625, 0.53662109375, 0.60052490234375, 0.6644287109375, 0.72833251953125, 0.792236328125, 0.85614013671875, 0.9200439453125, 0.98394775390625, 1.0478515625, 1.11175537109375, 1.1756591796875, 1.23956298828125, 1.303466796875, 1.36737060546875, 1.4312744140625, 1.49517822265625, 1.55908203125, 1.62298583984375, 1.6868896484375, 1.75079345703125, 1.814697265625, 1.87860107421875, 1.9425048828125, 2.00640869140625, 2.0703125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 9.0, 6.0, 15.0, 13.0, 15.0, 20.0, 22.0, 18.0, 22.0, 24.0, 25.0, 22.0, 26.0, 28.0, 26.0, 39.0, 27.0, 47.0, 30.0, 1060.0, 38.0, 42.0, 41.0, 39.0, 43.0, 30.0, 36.0, 28.0, 30.0, 27.0, 22.0, 19.0, 21.0, 13.0, 16.0, 10.0, 10.0, 13.0, 13.0, 4.0, 5.0, 8.0, 4.0, 2.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0], "bins": [-13.21875, -12.8275146484375, -12.436279296875, -12.0450439453125, -11.65380859375, -11.2625732421875, -10.871337890625, -10.4801025390625, -10.0888671875, -9.6976318359375, -9.306396484375, -8.9151611328125, -8.52392578125, -8.1326904296875, -7.741455078125, -7.3502197265625, -6.958984375, -6.5677490234375, -6.176513671875, -5.7852783203125, -5.39404296875, -5.0028076171875, -4.611572265625, -4.2203369140625, -3.8291015625, -3.4378662109375, -3.046630859375, -2.6553955078125, -2.26416015625, -1.8729248046875, -1.481689453125, -1.0904541015625, -0.69921875, -0.3079833984375, 0.083251953125, 0.4744873046875, 0.86572265625, 1.2569580078125, 1.648193359375, 2.0394287109375, 2.4306640625, 2.8218994140625, 3.213134765625, 3.6043701171875, 3.99560546875, 4.3868408203125, 4.778076171875, 5.1693115234375, 5.560546875, 5.9517822265625, 6.343017578125, 6.7342529296875, 7.12548828125, 7.5167236328125, 7.907958984375, 8.2991943359375, 8.6904296875, 9.0816650390625, 9.472900390625, 9.8641357421875, 10.25537109375, 10.6466064453125, 11.037841796875, 11.4290771484375, 11.8203125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 8.0, 10.0, 14.0, 16.0, 19.0, 30.0, 58.0, 69.0, 121.0, 172.0, 245.0, 407.0, 608.0, 1086.0, 1808.0, 2984.0, 5011.0, 8204.0, 14380.0, 25270.0, 44918.0, 85487.0, 184769.0, 1377734.0, 166132.0, 79172.0, 41924.0, 23496.0, 13238.0, 7877.0, 4707.0, 2770.0, 1635.0, 1001.0, 652.0, 390.0, 228.0, 170.0, 105.0, 64.0, 48.0, 44.0, 16.0, 14.0, 10.0, 6.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.04296875, -1.97357177734375, -1.9041748046875, -1.83477783203125, -1.765380859375, -1.69598388671875, -1.6265869140625, -1.55718994140625, -1.48779296875, -1.41839599609375, -1.3489990234375, -1.27960205078125, -1.210205078125, -1.14080810546875, -1.0714111328125, -1.00201416015625, -0.9326171875, -0.86322021484375, -0.7938232421875, -0.72442626953125, -0.655029296875, -0.58563232421875, -0.5162353515625, -0.44683837890625, -0.37744140625, -0.30804443359375, -0.2386474609375, -0.16925048828125, -0.099853515625, -0.03045654296875, 0.0389404296875, 0.10833740234375, 0.177734375, 0.24713134765625, 0.3165283203125, 0.38592529296875, 0.455322265625, 0.52471923828125, 0.5941162109375, 0.66351318359375, 0.73291015625, 0.80230712890625, 0.8717041015625, 0.94110107421875, 1.010498046875, 1.07989501953125, 1.1492919921875, 1.21868896484375, 1.2880859375, 1.35748291015625, 1.4268798828125, 1.49627685546875, 1.565673828125, 1.63507080078125, 1.7044677734375, 1.77386474609375, 1.84326171875, 1.91265869140625, 1.9820556640625, 2.05145263671875, 2.120849609375, 2.19024658203125, 2.2596435546875, 2.32904052734375, 2.3984375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 4.0, 6.0, 3.0, 11.0, 12.0, 22.0, 18.0, 30.0, 30.0, 36.0, 55.0, 46.0, 76.0, 85.0, 68.0, 63.0, 88.0, 67.0, 53.0, 31.0, 37.0, 30.0, 22.0, 31.0, 18.0, 13.0, 5.0, 11.0, 9.0, 3.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006443023681640625, -0.006241738796234131, -0.006040453910827637, -0.005839169025421143, -0.0056378841400146484, -0.005436599254608154, -0.00523531436920166, -0.005034029483795166, -0.004832744598388672, -0.004631459712982178, -0.004430174827575684, -0.0042288899421691895, -0.004027605056762695, -0.003826320171356201, -0.003625035285949707, -0.003423750400543213, -0.0032224655151367188, -0.0030211806297302246, -0.0028198957443237305, -0.0026186108589172363, -0.002417325973510742, -0.002216041088104248, -0.002014756202697754, -0.0018134713172912598, -0.0016121864318847656, -0.0014109015464782715, -0.0012096166610717773, -0.0010083317756652832, -0.0008070468902587891, -0.0006057620048522949, -0.0004044771194458008, -0.00020319223403930664, -1.9073486328125e-06, 0.00019937753677368164, 0.0004006624221801758, 0.0006019473075866699, 0.0008032321929931641, 0.0010045170783996582, 0.0012058019638061523, 0.0014070868492126465, 0.0016083717346191406, 0.0018096566200256348, 0.002010941505432129, 0.002212226390838623, 0.002413511276245117, 0.0026147961616516113, 0.0028160810470581055, 0.0030173659324645996, 0.0032186508178710938, 0.003419935703277588, 0.003621220588684082, 0.003822505474090576, 0.00402379035949707, 0.0042250752449035645, 0.004426360130310059, 0.004627645015716553, 0.004828929901123047, 0.005030214786529541, 0.005231499671936035, 0.005432784557342529, 0.0056340694427490234, 0.005835354328155518, 0.006036639213562012, 0.006237924098968506, 0.006439208984375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 6.0, 5.0, 9.0, 9.0, 12.0, 23.0, 20.0, 33.0, 45.0, 46.0, 84.0, 93.0, 148.0, 253.0, 669.0, 9602.0, 1031036.0, 5090.0, 573.0, 272.0, 143.0, 104.0, 79.0, 45.0, 43.0, 27.0, 23.0, 15.0, 10.0, 6.0, 7.0, 2.0, 7.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1336669921875, -0.129547119140625, -0.12542724609375, -0.121307373046875, -0.1171875, -0.113067626953125, -0.10894775390625, -0.104827880859375, -0.1007080078125, -0.096588134765625, -0.09246826171875, -0.088348388671875, -0.084228515625, -0.080108642578125, -0.07598876953125, -0.071868896484375, -0.0677490234375, -0.063629150390625, -0.05950927734375, -0.055389404296875, -0.05126953125, -0.047149658203125, -0.04302978515625, -0.038909912109375, -0.0347900390625, -0.030670166015625, -0.02655029296875, -0.022430419921875, -0.018310546875, -0.014190673828125, -0.01007080078125, -0.005950927734375, -0.0018310546875, 0.002288818359375, 0.00640869140625, 0.010528564453125, 0.0146484375, 0.018768310546875, 0.02288818359375, 0.027008056640625, 0.0311279296875, 0.035247802734375, 0.03936767578125, 0.043487548828125, 0.047607421875, 0.051727294921875, 0.05584716796875, 0.059967041015625, 0.0640869140625, 0.068206787109375, 0.07232666015625, 0.076446533203125, 0.08056640625, 0.084686279296875, 0.08880615234375, 0.092926025390625, 0.0970458984375, 0.101165771484375, 0.10528564453125, 0.109405517578125, 0.113525390625, 0.117645263671875, 0.12176513671875, 0.125885009765625, 0.1300048828125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 9.0, 16.0, 36.0, 97.0, 212.0, 319.0, 205.0, 67.0, 33.0, 13.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01027259323745966, -0.010036296211183071, -0.009800000116229057, -0.009563703089952469, -0.00932740606367588, -0.009091109968721867, -0.008854812942445278, -0.008618516847491264, -0.008382219821214676, -0.008145922794938087, -0.007909626699984074, -0.007673329673707485, -0.007437033113092184, -0.007200736552476883, -0.0069644395262002945, -0.006728142965584993, -0.006491846404969692, -0.006255549844354391, -0.00601925328373909, -0.0057829562574625015, -0.0055466596968472, -0.005310363136231899, -0.005074066109955311, -0.00483776954934001, -0.0046014729887247086, -0.004365176428109407, -0.004128879867494106, -0.003892582841217518, -0.0036562862806022167, -0.0034199897199869156, -0.003183692926540971, -0.002947396133095026, -0.002711100038141012, -0.002474803477525711, -0.0022385066840797663, -0.0020022098906338215, -0.0017659133300185204, -0.0015296166529878974, -0.0012933199759572744, -0.0010570232989266515, -0.0008207266218960285, -0.0005844299448654056, -0.0003481332678347826, -0.00011183659080415964, 0.00012446008622646332, 0.0003607567632570863, 0.0005970534402877092, 0.0008333501173183322, 0.0010696467943489552, 0.0013059434713795781, 0.001542240148410201, 0.001778536825440824, 0.002014833502471447, 0.002251130063086748, 0.002487426856532693, 0.0027237236499786377, 0.002960020210593939, 0.00319631677120924, 0.0034326135646551847, 0.0036689103581011295, 0.0039052069187164307, 0.004141503479331732, 0.004377800039947033, 0.004614097066223621, 0.0048503936268389225]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 0.0, 6.0, 3.0, 3.0, 10.0, 13.0, 11.0, 7.0, 19.0, 12.0, 22.0, 13.0, 18.0, 36.0, 28.0, 26.0, 30.0, 25.0, 38.0, 39.0, 31.0, 46.0, 40.0, 42.0, 50.0, 48.0, 29.0, 37.0, 33.0, 32.0, 38.0, 40.0, 22.0, 25.0, 14.0, 22.0, 18.0, 13.0, 15.0, 6.0, 2.0, 6.0, 8.0, 6.0, 6.0, 4.0, 4.0, 4.0, 3.0, 2.0, 6.0], "bins": [-0.0031769275665283203, -0.0030893180519342422, -0.003001708537340164, -0.002914099022746086, -0.002826489508152008, -0.00273887999355793, -0.002651270478963852, -0.002563660964369774, -0.002476051449775696, -0.0023884419351816177, -0.0023008324205875397, -0.0022132229059934616, -0.0021256133913993835, -0.0020380038768053055, -0.0019503943622112274, -0.0018627848476171494, -0.0017751753330230713, -0.0016875658184289932, -0.0015999563038349152, -0.001512346789240837, -0.001424737274646759, -0.001337127760052681, -0.001249518245458603, -0.0011619087308645248, -0.0010742992162704468, -0.0009866897016763687, -0.0008990801870822906, -0.0008114706724882126, -0.0007238611578941345, -0.0006362516433000565, -0.0005486421287059784, -0.00046103261411190033, -0.00037342309951782227, -0.0002858135849237442, -0.00019820407032966614, -0.00011059455573558807, -2.298504114151001e-05, 6.462447345256805e-05, 0.00015223398804664612, 0.00023984350264072418, 0.00032745301723480225, 0.0004150625318288803, 0.0005026720464229584, 0.0005902815610170364, 0.0006778910756111145, 0.0007655005902051926, 0.0008531101047992706, 0.0009407196193933487, 0.0010283291339874268, 0.0011159386485815048, 0.0012035481631755829, 0.001291157677769661, 0.001378767192363739, 0.001466376706957817, 0.0015539862215518951, 0.0016415957361459732, 0.0017292052507400513, 0.0018168147653341293, 0.0019044242799282074, 0.0019920337945222855, 0.0020796433091163635, 0.0021672528237104416, 0.0022548623383045197, 0.0023424718528985977, 0.0024300813674926758]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 7.0, 5.0, 8.0, 7.0, 10.0, 16.0, 23.0, 13.0, 16.0, 28.0, 23.0, 40.0, 37.0, 45.0, 43.0, 34.0, 44.0, 40.0, 52.0, 49.0, 46.0, 28.0, 32.0, 40.0, 51.0, 32.0, 32.0, 25.0, 30.0, 19.0, 29.0, 13.0, 11.0, 10.0, 18.0, 17.0, 8.0, 10.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.046875, -22.3515625, -21.65625, -20.9609375, -20.265625, -19.5703125, -18.875, -18.1796875, -17.484375, -16.7890625, -16.09375, -15.3984375, -14.703125, -14.0078125, -13.3125, -12.6171875, -11.921875, -11.2265625, -10.53125, -9.8359375, -9.140625, -8.4453125, -7.75, -7.0546875, -6.359375, -5.6640625, -4.96875, -4.2734375, -3.578125, -2.8828125, -2.1875, -1.4921875, -0.796875, -0.1015625, 0.59375, 1.2890625, 1.984375, 2.6796875, 3.375, 4.0703125, 4.765625, 5.4609375, 6.15625, 6.8515625, 7.546875, 8.2421875, 8.9375, 9.6328125, 10.328125, 11.0234375, 11.71875, 12.4140625, 13.109375, 13.8046875, 14.5, 15.1953125, 15.890625, 16.5859375, 17.28125, 17.9765625, 18.671875, 19.3671875, 20.0625, 20.7578125, 21.453125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 2.0, 3.0, 4.0, 1.0, 7.0, 6.0, 9.0, 8.0, 17.0, 18.0, 31.0, 37.0, 55.0, 68.0, 67.0, 122.0, 173.0, 257.0, 374.0, 788.0, 2125.0, 11805.0, 270879.0, 732882.0, 23239.0, 3222.0, 916.0, 434.0, 314.0, 181.0, 136.0, 96.0, 77.0, 35.0, 42.0, 25.0, 16.0, 14.0, 24.0, 20.0, 11.0, 10.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-46.4375, -45.0361328125, -43.634765625, -42.2333984375, -40.83203125, -39.4306640625, -38.029296875, -36.6279296875, -35.2265625, -33.8251953125, -32.423828125, -31.0224609375, -29.62109375, -28.2197265625, -26.818359375, -25.4169921875, -24.015625, -22.6142578125, -21.212890625, -19.8115234375, -18.41015625, -17.0087890625, -15.607421875, -14.2060546875, -12.8046875, -11.4033203125, -10.001953125, -8.6005859375, -7.19921875, -5.7978515625, -4.396484375, -2.9951171875, -1.59375, -0.1923828125, 1.208984375, 2.6103515625, 4.01171875, 5.4130859375, 6.814453125, 8.2158203125, 9.6171875, 11.0185546875, 12.419921875, 13.8212890625, 15.22265625, 16.6240234375, 18.025390625, 19.4267578125, 20.828125, 22.2294921875, 23.630859375, 25.0322265625, 26.43359375, 27.8349609375, 29.236328125, 30.6376953125, 32.0390625, 33.4404296875, 34.841796875, 36.2431640625, 37.64453125, 39.0458984375, 40.447265625, 41.8486328125, 43.25]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 7.0, 6.0, 7.0, 10.0, 11.0, 9.0, 16.0, 14.0, 21.0, 15.0, 25.0, 36.0, 25.0, 30.0, 36.0, 28.0, 41.0, 54.0, 66.0, 216.0, 1838.0, 82.0, 49.0, 51.0, 42.0, 42.0, 33.0, 37.0, 27.0, 26.0, 28.0, 16.0, 20.0, 10.0, 15.0, 11.0, 9.0, 7.0, 10.0, 4.0, 5.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0], "bins": [-78.5625, -76.39794921875, -74.2333984375, -72.06884765625, -69.904296875, -67.73974609375, -65.5751953125, -63.41064453125, -61.24609375, -59.08154296875, -56.9169921875, -54.75244140625, -52.587890625, -50.42333984375, -48.2587890625, -46.09423828125, -43.9296875, -41.76513671875, -39.6005859375, -37.43603515625, -35.271484375, -33.10693359375, -30.9423828125, -28.77783203125, -26.61328125, -24.44873046875, -22.2841796875, -20.11962890625, -17.955078125, -15.79052734375, -13.6259765625, -11.46142578125, -9.296875, -7.13232421875, -4.9677734375, -2.80322265625, -0.638671875, 1.52587890625, 3.6904296875, 5.85498046875, 8.01953125, 10.18408203125, 12.3486328125, 14.51318359375, 16.677734375, 18.84228515625, 21.0068359375, 23.17138671875, 25.3359375, 27.50048828125, 29.6650390625, 31.82958984375, 33.994140625, 36.15869140625, 38.3232421875, 40.48779296875, 42.65234375, 44.81689453125, 46.9814453125, 49.14599609375, 51.310546875, 53.47509765625, 55.6396484375, 57.80419921875, 59.96875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 4.0, 4.0, 9.0, 6.0, 12.0, 9.0, 17.0, 16.0, 24.0, 18.0, 31.0, 33.0, 50.0, 57.0, 71.0, 112.0, 152.0, 312.0, 923.0, 8423.0, 3109998.0, 22921.0, 1412.0, 403.0, 187.0, 110.0, 84.0, 56.0, 45.0, 43.0, 28.0, 30.0, 19.0, 11.0, 16.0, 13.0, 9.0, 7.0, 8.0, 8.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-140.625, -135.53515625, -130.4453125, -125.35546875, -120.265625, -115.17578125, -110.0859375, -104.99609375, -99.90625, -94.81640625, -89.7265625, -84.63671875, -79.546875, -74.45703125, -69.3671875, -64.27734375, -59.1875, -54.09765625, -49.0078125, -43.91796875, -38.828125, -33.73828125, -28.6484375, -23.55859375, -18.46875, -13.37890625, -8.2890625, -3.19921875, 1.890625, 6.98046875, 12.0703125, 17.16015625, 22.25, 27.33984375, 32.4296875, 37.51953125, 42.609375, 47.69921875, 52.7890625, 57.87890625, 62.96875, 68.05859375, 73.1484375, 78.23828125, 83.328125, 88.41796875, 93.5078125, 98.59765625, 103.6875, 108.77734375, 113.8671875, 118.95703125, 124.046875, 129.13671875, 134.2265625, 139.31640625, 144.40625, 149.49609375, 154.5859375, 159.67578125, 164.765625, 169.85546875, 174.9453125, 180.03515625, 185.125]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 39.0, 465.0, 464.0, 42.0, 3.0], "bins": [-543.4522705078125, -534.5348510742188, -525.6173706054688, -516.699951171875, -507.7825012207031, -498.86505126953125, -489.9476013183594, -481.0301513671875, -472.11273193359375, -463.1952819824219, -454.27783203125, -445.36041259765625, -436.4429626464844, -427.5255126953125, -418.6080627441406, -409.69061279296875, -400.773193359375, -391.8557434082031, -382.93829345703125, -374.0208740234375, -365.1034240722656, -356.18597412109375, -347.2685241699219, -338.35107421875, -329.4336242675781, -320.51617431640625, -311.5987243652344, -302.6813049316406, -293.76385498046875, -284.8464050292969, -275.928955078125, -267.01153564453125, -258.0940856933594, -249.1766357421875, -240.2592010498047, -231.3417510986328, -222.42431640625, -213.50686645507812, -204.58941650390625, -195.67198181152344, -186.75453186035156, -177.8370819091797, -168.91964721679688, -160.002197265625, -151.0847625732422, -142.1673126220703, -133.2498779296875, -124.33242797851562, -115.41497802734375, -106.4975357055664, -97.58009338378906, -88.66264343261719, -79.74520874023438, -70.8277587890625, -61.910316467285156, -52.99287414550781, -44.07543182373047, -35.157989501953125, -26.24054527282715, -17.323101043701172, -8.405658721923828, 0.5117835998535156, 9.429229736328125, 18.34667205810547, 27.26411247253418]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 3.0, 0.0, 1.0, 9.0, 6.0, 7.0, 8.0, 15.0, 9.0, 18.0, 18.0, 17.0, 28.0, 33.0, 33.0, 26.0, 32.0, 36.0, 26.0, 38.0, 31.0, 28.0, 28.0, 39.0, 47.0, 40.0, 48.0, 37.0, 44.0, 34.0, 24.0, 26.0, 31.0, 21.0, 29.0, 13.0, 18.0, 15.0, 22.0, 15.0, 5.0, 11.0, 5.0, 7.0, 6.0, 5.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-147.72052001953125, -142.8674774169922, -138.01443481445312, -133.16139221191406, -128.308349609375, -123.45530700683594, -118.60225677490234, -113.74921417236328, -108.89617156982422, -104.04312896728516, -99.1900863647461, -94.33704376220703, -89.48399353027344, -84.63095092773438, -79.77790832519531, -74.92486572265625, -70.07182312011719, -65.21878051757812, -60.36573791503906, -55.512691497802734, -50.65964889526367, -45.80660629272461, -40.95355987548828, -36.10051727294922, -31.247474670410156, -26.394432067871094, -21.5413875579834, -16.688343048095703, -11.83530044555664, -6.982257843017578, -2.129213333129883, 2.7238311767578125, 7.5768585205078125, 12.429902076721191, 17.28294563293457, 22.135990142822266, 26.989032745361328, 31.84207534790039, 36.69512176513672, 41.54816436767578, 46.401206970214844, 51.254249572753906, 56.10729217529297, 60.9603385925293, 65.81338500976562, 70.66642761230469, 75.51947021484375, 80.37251281738281, 85.22555541992188, 90.07859802246094, 94.931640625, 99.78468322753906, 104.63772583007812, 109.49076843261719, 114.34381866455078, 119.19686126708984, 124.0499038696289, 128.9029541015625, 133.75599670410156, 138.60903930664062, 143.4620819091797, 148.31512451171875, 153.1681671142578, 158.02120971679688, 162.87425231933594]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 6.0, 2.0, 3.0, 7.0, 6.0, 9.0, 9.0, 7.0, 9.0, 12.0, 15.0, 16.0, 33.0, 28.0, 27.0, 40.0, 37.0, 34.0, 41.0, 38.0, 57.0, 35.0, 57.0, 47.0, 35.0, 33.0, 39.0, 44.0, 29.0, 44.0, 26.0, 35.0, 23.0, 24.0, 15.0, 15.0, 17.0, 15.0, 9.0, 8.0, 6.0, 6.0, 6.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.78125, -21.069580078125, -20.35791015625, -19.646240234375, -18.9345703125, -18.222900390625, -17.51123046875, -16.799560546875, -16.087890625, -15.376220703125, -14.66455078125, -13.952880859375, -13.2412109375, -12.529541015625, -11.81787109375, -11.106201171875, -10.39453125, -9.682861328125, -8.97119140625, -8.259521484375, -7.5478515625, -6.836181640625, -6.12451171875, -5.412841796875, -4.701171875, -3.989501953125, -3.27783203125, -2.566162109375, -1.8544921875, -1.142822265625, -0.43115234375, 0.280517578125, 0.9921875, 1.703857421875, 2.41552734375, 3.127197265625, 3.8388671875, 4.550537109375, 5.26220703125, 5.973876953125, 6.685546875, 7.397216796875, 8.10888671875, 8.820556640625, 9.5322265625, 10.243896484375, 10.95556640625, 11.667236328125, 12.37890625, 13.090576171875, 13.80224609375, 14.513916015625, 15.2255859375, 15.937255859375, 16.64892578125, 17.360595703125, 18.072265625, 18.783935546875, 19.49560546875, 20.207275390625, 20.9189453125, 21.630615234375, 22.34228515625, 23.053955078125, 23.765625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 2.0, 7.0, 8.0, 14.0, 17.0, 22.0, 35.0, 23.0, 60.0, 82.0, 111.0, 161.0, 239.0, 380.0, 590.0, 942.0, 1553.0, 2630.0, 4939.0, 10171.0, 29701.0, 461128.0, 3346159.0, 290031.0, 25510.0, 9027.0, 4418.0, 2429.0, 1373.0, 879.0, 534.0, 346.0, 242.0, 150.0, 110.0, 68.0, 44.0, 51.0, 27.0, 19.0, 15.0, 12.0, 6.0, 5.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.5625, -52.76953125, -50.9765625, -49.18359375, -47.390625, -45.59765625, -43.8046875, -42.01171875, -40.21875, -38.42578125, -36.6328125, -34.83984375, -33.046875, -31.25390625, -29.4609375, -27.66796875, -25.875, -24.08203125, -22.2890625, -20.49609375, -18.703125, -16.91015625, -15.1171875, -13.32421875, -11.53125, -9.73828125, -7.9453125, -6.15234375, -4.359375, -2.56640625, -0.7734375, 1.01953125, 2.8125, 4.60546875, 6.3984375, 8.19140625, 9.984375, 11.77734375, 13.5703125, 15.36328125, 17.15625, 18.94921875, 20.7421875, 22.53515625, 24.328125, 26.12109375, 27.9140625, 29.70703125, 31.5, 33.29296875, 35.0859375, 36.87890625, 38.671875, 40.46484375, 42.2578125, 44.05078125, 45.84375, 47.63671875, 49.4296875, 51.22265625, 53.015625, 54.80859375, 56.6015625, 58.39453125, 60.1875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 6.0, 2.0, 8.0, 2.0, 9.0, 17.0, 25.0, 24.0, 44.0, 60.0, 79.0, 160.0, 389.0, 792.0, 1099.0, 734.0, 308.0, 107.0, 70.0, 39.0, 24.0, 13.0, 26.0, 7.0, 4.0, 6.0, 8.0, 6.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.40625, -45.61181640625, -43.8173828125, -42.02294921875, -40.228515625, -38.43408203125, -36.6396484375, -34.84521484375, -33.05078125, -31.25634765625, -29.4619140625, -27.66748046875, -25.873046875, -24.07861328125, -22.2841796875, -20.48974609375, -18.6953125, -16.90087890625, -15.1064453125, -13.31201171875, -11.517578125, -9.72314453125, -7.9287109375, -6.13427734375, -4.33984375, -2.54541015625, -0.7509765625, 1.04345703125, 2.837890625, 4.63232421875, 6.4267578125, 8.22119140625, 10.015625, 11.81005859375, 13.6044921875, 15.39892578125, 17.193359375, 18.98779296875, 20.7822265625, 22.57666015625, 24.37109375, 26.16552734375, 27.9599609375, 29.75439453125, 31.548828125, 33.34326171875, 35.1376953125, 36.93212890625, 38.7265625, 40.52099609375, 42.3154296875, 44.10986328125, 45.904296875, 47.69873046875, 49.4931640625, 51.28759765625, 53.08203125, 54.87646484375, 56.6708984375, 58.46533203125, 60.259765625, 62.05419921875, 63.8486328125, 65.64306640625, 67.4375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 0.0, 4.0, 4.0, 7.0, 10.0, 20.0, 24.0, 37.0, 57.0, 113.0, 157.0, 294.0, 639.0, 1361.0, 3582.0, 11358.0, 51378.0, 2296749.0, 1764045.0, 47434.0, 10753.0, 3448.0, 1387.0, 648.0, 310.0, 180.0, 97.0, 71.0, 31.0, 29.0, 18.0, 9.0, 14.0, 8.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-122.5, -119.1875, -115.875, -112.5625, -109.25, -105.9375, -102.625, -99.3125, -96.0, -92.6875, -89.375, -86.0625, -82.75, -79.4375, -76.125, -72.8125, -69.5, -66.1875, -62.875, -59.5625, -56.25, -52.9375, -49.625, -46.3125, -43.0, -39.6875, -36.375, -33.0625, -29.75, -26.4375, -23.125, -19.8125, -16.5, -13.1875, -9.875, -6.5625, -3.25, 0.0625, 3.375, 6.6875, 10.0, 13.3125, 16.625, 19.9375, 23.25, 26.5625, 29.875, 33.1875, 36.5, 39.8125, 43.125, 46.4375, 49.75, 53.0625, 56.375, 59.6875, 63.0, 66.3125, 69.625, 72.9375, 76.25, 79.5625, 82.875, 86.1875, 89.5]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 9.0, 16.0, 39.0, 74.0, 120.0, 249.0, 253.0, 128.0, 56.0, 33.0, 14.0, 8.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-329.2846374511719, -320.6351318359375, -311.98565673828125, -303.3361511230469, -294.6866760253906, -286.03717041015625, -277.3876953125, -268.7381896972656, -260.08868408203125, -251.43919372558594, -242.78970336914062, -234.14019775390625, -225.49070739746094, -216.84121704101562, -208.1917266845703, -199.542236328125, -190.8927459716797, -182.24325561523438, -173.59376525878906, -164.94427490234375, -156.29476928710938, -147.64527893066406, -138.99578857421875, -130.34629821777344, -121.6968002319336, -113.04730987548828, -104.39781188964844, -95.74832153320312, -87.09883117675781, -78.44933319091797, -69.79984283447266, -61.15034866333008, -52.50083923339844, -43.85134506225586, -35.20185089111328, -26.55236053466797, -17.90286636352539, -9.253372192382812, -0.6038818359375, 8.045612335205078, 16.695106506347656, 25.344600677490234, 33.99409484863281, 42.643585205078125, 51.2930793762207, 59.94257354736328, 68.5920639038086, 77.24156188964844, 85.89105224609375, 94.54054260253906, 103.1900405883789, 111.83953094482422, 120.48902893066406, 129.13851928710938, 137.7880096435547, 146.4375, 155.08700561523438, 163.7364959716797, 172.385986328125, 181.03549194335938, 189.6849822998047, 198.33447265625, 206.9839630126953, 215.63345336914062, 224.28294372558594]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 6.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 7.0, 9.0, 8.0, 11.0, 12.0, 8.0, 19.0, 18.0, 22.0, 20.0, 28.0, 32.0, 37.0, 32.0, 30.0, 35.0, 42.0, 48.0, 32.0, 41.0, 32.0, 25.0, 32.0, 34.0, 50.0, 22.0, 36.0, 30.0, 28.0, 18.0, 31.0, 21.0, 26.0, 15.0, 22.0, 10.0, 5.0, 13.0, 13.0, 7.0, 7.0, 3.0, 3.0, 8.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0], "bins": [-106.82841491699219, -103.62236785888672, -100.41631317138672, -97.21026611328125, -94.00421905517578, -90.79817199707031, -87.59211730957031, -84.38607025146484, -81.18002319335938, -77.9739761352539, -74.7679214477539, -71.56187438964844, -68.35582733154297, -65.1497802734375, -61.9437255859375, -58.73767852783203, -55.5316276550293, -52.32557678222656, -49.119529724121094, -45.91347885131836, -42.70743179321289, -39.501380920410156, -36.29533386230469, -33.08928298950195, -29.88323402404785, -26.67718505859375, -23.47113609313965, -20.265087127685547, -17.059036254882812, -13.852987289428711, -10.64693832397461, -7.440889358520508, -4.234840393066406, -1.0287911891937256, 2.177258014678955, 5.383307456970215, 8.589356422424316, 11.795406341552734, 15.001455307006836, 18.207504272460938, 21.41355323791504, 24.61960220336914, 27.825651168823242, 31.031700134277344, 34.23775100708008, 37.44380187988281, 40.64984893798828, 43.85589599609375, 47.061946868896484, 50.26799774169922, 53.47404479980469, 56.68009567260742, 59.88614273071289, 63.092193603515625, 66.2982406616211, 69.50428771972656, 72.71034240722656, 75.91638946533203, 79.12244415283203, 82.3284912109375, 85.53453826904297, 88.74058532714844, 91.94664001464844, 95.1526870727539, 98.35873413085938]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 9.0, 9.0, 6.0, 9.0, 7.0, 10.0, 15.0, 8.0, 15.0, 19.0, 17.0, 25.0, 29.0, 27.0, 28.0, 38.0, 37.0, 35.0, 39.0, 66.0, 37.0, 41.0, 40.0, 37.0, 31.0, 45.0, 32.0, 21.0, 30.0, 26.0, 34.0, 32.0, 20.0, 20.0, 12.0, 17.0, 13.0, 15.0, 6.0, 17.0, 10.0, 6.0, 2.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.8125, -21.1240234375, -20.435546875, -19.7470703125, -19.05859375, -18.3701171875, -17.681640625, -16.9931640625, -16.3046875, -15.6162109375, -14.927734375, -14.2392578125, -13.55078125, -12.8623046875, -12.173828125, -11.4853515625, -10.796875, -10.1083984375, -9.419921875, -8.7314453125, -8.04296875, -7.3544921875, -6.666015625, -5.9775390625, -5.2890625, -4.6005859375, -3.912109375, -3.2236328125, -2.53515625, -1.8466796875, -1.158203125, -0.4697265625, 0.21875, 0.9072265625, 1.595703125, 2.2841796875, 2.97265625, 3.6611328125, 4.349609375, 5.0380859375, 5.7265625, 6.4150390625, 7.103515625, 7.7919921875, 8.48046875, 9.1689453125, 9.857421875, 10.5458984375, 11.234375, 11.9228515625, 12.611328125, 13.2998046875, 13.98828125, 14.6767578125, 15.365234375, 16.0537109375, 16.7421875, 17.4306640625, 18.119140625, 18.8076171875, 19.49609375, 20.1845703125, 20.873046875, 21.5615234375, 22.25]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 11.0, 7.0, 13.0, 28.0, 34.0, 58.0, 66.0, 117.0, 208.0, 300.0, 425.0, 587.0, 962.0, 1385.0, 2101.0, 3270.0, 4822.0, 7409.0, 11044.0, 17119.0, 27326.0, 44723.0, 78191.0, 151878.0, 287703.0, 181855.0, 90536.0, 50566.0, 30421.0, 19240.0, 12188.0, 8056.0, 5361.0, 3510.0, 2384.0, 1522.0, 1033.0, 722.0, 459.0, 302.0, 235.0, 131.0, 75.0, 61.0, 39.0, 24.0, 20.0, 12.0, 9.0, 7.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.01953125, -1.955657958984375, -1.89178466796875, -1.827911376953125, -1.7640380859375, -1.700164794921875, -1.63629150390625, -1.572418212890625, -1.508544921875, -1.444671630859375, -1.38079833984375, -1.316925048828125, -1.2530517578125, -1.189178466796875, -1.12530517578125, -1.061431884765625, -0.99755859375, -0.933685302734375, -0.86981201171875, -0.805938720703125, -0.7420654296875, -0.678192138671875, -0.61431884765625, -0.550445556640625, -0.486572265625, -0.422698974609375, -0.35882568359375, -0.294952392578125, -0.2310791015625, -0.167205810546875, -0.10333251953125, -0.039459228515625, 0.0244140625, 0.088287353515625, 0.15216064453125, 0.216033935546875, 0.2799072265625, 0.343780517578125, 0.40765380859375, 0.471527099609375, 0.535400390625, 0.599273681640625, 0.66314697265625, 0.727020263671875, 0.7908935546875, 0.854766845703125, 0.91864013671875, 0.982513427734375, 1.04638671875, 1.110260009765625, 1.17413330078125, 1.238006591796875, 1.3018798828125, 1.365753173828125, 1.42962646484375, 1.493499755859375, 1.557373046875, 1.621246337890625, 1.68511962890625, 1.748992919921875, 1.8128662109375, 1.876739501953125, 1.94061279296875, 2.004486083984375, 2.068359375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 11.0, 8.0, 9.0, 11.0, 9.0, 19.0, 26.0, 24.0, 34.0, 24.0, 37.0, 46.0, 43.0, 35.0, 38.0, 42.0, 49.0, 1081.0, 35.0, 58.0, 44.0, 37.0, 42.0, 36.0, 34.0, 28.0, 28.0, 22.0, 16.0, 21.0, 17.0, 15.0, 3.0, 7.0, 6.0, 8.0, 5.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.140625, -15.62744140625, -15.1142578125, -14.60107421875, -14.087890625, -13.57470703125, -13.0615234375, -12.54833984375, -12.03515625, -11.52197265625, -11.0087890625, -10.49560546875, -9.982421875, -9.46923828125, -8.9560546875, -8.44287109375, -7.9296875, -7.41650390625, -6.9033203125, -6.39013671875, -5.876953125, -5.36376953125, -4.8505859375, -4.33740234375, -3.82421875, -3.31103515625, -2.7978515625, -2.28466796875, -1.771484375, -1.25830078125, -0.7451171875, -0.23193359375, 0.28125, 0.79443359375, 1.3076171875, 1.82080078125, 2.333984375, 2.84716796875, 3.3603515625, 3.87353515625, 4.38671875, 4.89990234375, 5.4130859375, 5.92626953125, 6.439453125, 6.95263671875, 7.4658203125, 7.97900390625, 8.4921875, 9.00537109375, 9.5185546875, 10.03173828125, 10.544921875, 11.05810546875, 11.5712890625, 12.08447265625, 12.59765625, 13.11083984375, 13.6240234375, 14.13720703125, 14.650390625, 15.16357421875, 15.6767578125, 16.18994140625, 16.703125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 8.0, 1.0, 4.0, 14.0, 17.0, 18.0, 27.0, 46.0, 50.0, 87.0, 133.0, 177.0, 341.0, 486.0, 773.0, 1198.0, 2159.0, 3420.0, 5801.0, 9629.0, 16772.0, 30644.0, 57926.0, 120972.0, 1332585.0, 280639.0, 111806.0, 54146.0, 28307.0, 15906.0, 9028.0, 5410.0, 3268.0, 1988.0, 1246.0, 734.0, 486.0, 294.0, 185.0, 134.0, 92.0, 61.0, 31.0, 30.0, 23.0, 18.0, 8.0, 4.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.453125, -2.3763427734375, -2.299560546875, -2.2227783203125, -2.14599609375, -2.0692138671875, -1.992431640625, -1.9156494140625, -1.8388671875, -1.7620849609375, -1.685302734375, -1.6085205078125, -1.53173828125, -1.4549560546875, -1.378173828125, -1.3013916015625, -1.224609375, -1.1478271484375, -1.071044921875, -0.9942626953125, -0.91748046875, -0.8406982421875, -0.763916015625, -0.6871337890625, -0.6103515625, -0.5335693359375, -0.456787109375, -0.3800048828125, -0.30322265625, -0.2264404296875, -0.149658203125, -0.0728759765625, 0.00390625, 0.0806884765625, 0.157470703125, 0.2342529296875, 0.31103515625, 0.3878173828125, 0.464599609375, 0.5413818359375, 0.6181640625, 0.6949462890625, 0.771728515625, 0.8485107421875, 0.92529296875, 1.0020751953125, 1.078857421875, 1.1556396484375, 1.232421875, 1.3092041015625, 1.385986328125, 1.4627685546875, 1.53955078125, 1.6163330078125, 1.693115234375, 1.7698974609375, 1.8466796875, 1.9234619140625, 2.000244140625, 2.0770263671875, 2.15380859375, 2.2305908203125, 2.307373046875, 2.3841552734375, 2.4609375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 7.0, 7.0, 8.0, 2.0, 11.0, 19.0, 18.0, 20.0, 24.0, 34.0, 44.0, 57.0, 56.0, 74.0, 82.0, 61.0, 92.0, 74.0, 57.0, 56.0, 43.0, 27.0, 35.0, 26.0, 15.0, 11.0, 6.0, 2.0, 9.0, 3.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005584716796875, -0.005389988422393799, -0.005195260047912598, -0.0050005316734313965, -0.004805803298950195, -0.004611074924468994, -0.004416346549987793, -0.004221618175506592, -0.004026889801025391, -0.0038321614265441895, -0.0036374330520629883, -0.003442704677581787, -0.003247976303100586, -0.0030532479286193848, -0.0028585195541381836, -0.0026637911796569824, -0.0024690628051757812, -0.00227433443069458, -0.002079606056213379, -0.0018848776817321777, -0.0016901493072509766, -0.0014954209327697754, -0.0013006925582885742, -0.001105964183807373, -0.0009112358093261719, -0.0007165074348449707, -0.0005217790603637695, -0.00032705068588256836, -0.0001323223114013672, 6.240606307983398e-05, 0.00025713443756103516, 0.00045186281204223633, 0.0006465911865234375, 0.0008413195610046387, 0.0010360479354858398, 0.001230776309967041, 0.0014255046844482422, 0.0016202330589294434, 0.0018149614334106445, 0.0020096898078918457, 0.002204418182373047, 0.002399146556854248, 0.0025938749313354492, 0.0027886033058166504, 0.0029833316802978516, 0.0031780600547790527, 0.003372788429260254, 0.003567516803741455, 0.0037622451782226562, 0.003956973552703857, 0.004151701927185059, 0.00434643030166626, 0.004541158676147461, 0.004735887050628662, 0.004930615425109863, 0.0051253437995910645, 0.005320072174072266, 0.005514800548553467, 0.005709528923034668, 0.005904257297515869, 0.00609898567199707, 0.0062937140464782715, 0.006488442420959473, 0.006683170795440674, 0.006877899169921875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 4.0, 6.0, 7.0, 14.0, 4.0, 10.0, 16.0, 22.0, 41.0, 55.0, 82.0, 96.0, 139.0, 239.0, 422.0, 1600.0, 722588.0, 320760.0, 1237.0, 422.0, 229.0, 147.0, 94.0, 79.0, 45.0, 41.0, 39.0, 15.0, 20.0, 9.0, 15.0, 12.0, 9.0, 7.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.1304931640625, -0.1268625259399414, -0.12323188781738281, -0.11960124969482422, -0.11597061157226562, -0.11233997344970703, -0.10870933532714844, -0.10507869720458984, -0.10144805908203125, -0.09781742095947266, -0.09418678283691406, -0.09055614471435547, -0.08692550659179688, -0.08329486846923828, -0.07966423034667969, -0.0760335922241211, -0.0724029541015625, -0.0687723159790039, -0.06514167785644531, -0.06151103973388672, -0.057880401611328125, -0.05424976348876953, -0.05061912536621094, -0.046988487243652344, -0.04335784912109375, -0.039727210998535156, -0.03609657287597656, -0.03246593475341797, -0.028835296630859375, -0.02520465850830078, -0.021574020385742188, -0.017943382263183594, -0.014312744140625, -0.010682106018066406, -0.0070514678955078125, -0.0034208297729492188, 0.000209808349609375, 0.0038404464721679688, 0.0074710845947265625, 0.011101722717285156, 0.01473236083984375, 0.018362998962402344, 0.021993637084960938, 0.02562427520751953, 0.029254913330078125, 0.03288555145263672, 0.03651618957519531, 0.040146827697753906, 0.0437774658203125, 0.047408103942871094, 0.05103874206542969, 0.05466938018798828, 0.058300018310546875, 0.06193065643310547, 0.06556129455566406, 0.06919193267822266, 0.07282257080078125, 0.07645320892333984, 0.08008384704589844, 0.08371448516845703, 0.08734512329101562, 0.09097576141357422, 0.09460639953613281, 0.0982370376586914, 0.10186767578125]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 0.0, 19.0, 30.0, 119.0, 250.0, 302.0, 193.0, 64.0, 26.0, 8.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002334680175408721, -0.002080495934933424, -0.0018263118108734488, -0.0015721276868134737, -0.0013179434463381767, -0.0010637592058628798, -0.0008095750818029046, -0.0005553909577429295, -0.0003012067172676325, -4.7022534999996424e-05, 0.00020716164726763964, 0.0004613458295352757, 0.0007155300118029118, 0.0009697142522782087, 0.0012238983763381839, 0.001478082500398159, 0.001732266740873456, 0.001986450981348753, 0.0022406349889934063, 0.0024948192294687033, 0.0027490034699440002, 0.0030031877104192972, 0.003257371950894594, 0.0035115559585392475, 0.0037657401990145445, 0.0040199244394898415, 0.004274108447134495, 0.004528292920440435, 0.004782476928085089, 0.005036661401391029, 0.005290845409035683, 0.005545029416680336, 0.005799214355647564, 0.006053398363292217, 0.006307582836598158, 0.006561766844242811, 0.006815951317548752, 0.007070135325193405, 0.0073243193328380585, 0.007578503340482712, 0.007832687348127365, 0.008086871355772018, 0.008341055363416672, 0.0085952403023839, 0.008849424310028553, 0.009103608317673206, 0.00935779232531786, 0.009611976332962513, 0.009866161271929741, 0.010120345279574394, 0.010374529287219048, 0.010628714226186275, 0.010882898233830929, 0.011137082241475582, 0.011391266249120235, 0.011645450256764889, 0.011899635195732117, 0.01215381920337677, 0.012408003211021423, 0.012662188149988651, 0.012916372157633305, 0.013170556165277958, 0.013424740172922611, 0.013678924180567265, 0.013933108188211918]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 8.0, 16.0, 15.0, 12.0, 17.0, 11.0, 21.0, 18.0, 28.0, 20.0, 27.0, 24.0, 30.0, 35.0, 39.0, 43.0, 33.0, 36.0, 47.0, 44.0, 49.0, 44.0, 43.0, 33.0, 36.0, 30.0, 30.0, 31.0, 28.0, 23.0, 20.0, 10.0, 17.0, 15.0, 16.0, 9.0, 6.0, 8.0, 4.0, 7.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026065707206726074, -0.0025192173197865486, -0.00243186391890049, -0.002344510518014431, -0.002257157117128372, -0.0021698037162423134, -0.0020824503153562546, -0.0019950969144701958, -0.001907743513584137, -0.0018203901126980782, -0.0017330367118120193, -0.0016456833109259605, -0.0015583299100399017, -0.001470976509153843, -0.0013836231082677841, -0.0012962697073817253, -0.0012089163064956665, -0.0011215629056096077, -0.0010342095047235489, -0.0009468561038374901, -0.0008595027029514313, -0.0007721493020653725, -0.0006847959011793137, -0.0005974425002932549, -0.000510089099407196, -0.00042273569852113724, -0.00033538229763507843, -0.0002480288967490196, -0.00016067549586296082, -7.332209497690201e-05, 1.40313059091568e-05, 0.0001013847067952156, 0.00018873810768127441, 0.0002760915085673332, 0.00036344490945339203, 0.00045079831033945084, 0.0005381517112255096, 0.0006255051121115685, 0.0007128585129976273, 0.0008002119138836861, 0.0008875653147697449, 0.0009749187156558037, 0.0010622721165418625, 0.0011496255174279213, 0.00123697891831398, 0.001324332319200039, 0.0014116857200860977, 0.0014990391209721565, 0.0015863925218582153, 0.0016737459227442741, 0.001761099323630333, 0.0018484527245163918, 0.0019358061254024506, 0.0020231595262885094, 0.002110512927174568, 0.002197866328060627, 0.002285219728946686, 0.0023725731298327446, 0.0024599265307188034, 0.002547279931604862, 0.002634633332490921, 0.00272198673337698, 0.0028093401342630386, 0.0028966935351490974, 0.0029840469360351562]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 9.0, 9.0, 6.0, 9.0, 7.0, 10.0, 15.0, 8.0, 15.0, 19.0, 17.0, 25.0, 29.0, 27.0, 28.0, 38.0, 37.0, 35.0, 39.0, 66.0, 37.0, 41.0, 40.0, 37.0, 31.0, 45.0, 32.0, 21.0, 30.0, 26.0, 34.0, 32.0, 20.0, 20.0, 12.0, 17.0, 13.0, 15.0, 6.0, 17.0, 10.0, 6.0, 2.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.8125, -21.1240234375, -20.435546875, -19.7470703125, -19.05859375, -18.3701171875, -17.681640625, -16.9931640625, -16.3046875, -15.6162109375, -14.927734375, -14.2392578125, -13.55078125, -12.8623046875, -12.173828125, -11.4853515625, -10.796875, -10.1083984375, -9.419921875, -8.7314453125, -8.04296875, -7.3544921875, -6.666015625, -5.9775390625, -5.2890625, -4.6005859375, -3.912109375, -3.2236328125, -2.53515625, -1.8466796875, -1.158203125, -0.4697265625, 0.21875, 0.9072265625, 1.595703125, 2.2841796875, 2.97265625, 3.6611328125, 4.349609375, 5.0380859375, 5.7265625, 6.4150390625, 7.103515625, 7.7919921875, 8.48046875, 9.1689453125, 9.857421875, 10.5458984375, 11.234375, 11.9228515625, 12.611328125, 13.2998046875, 13.98828125, 14.6767578125, 15.365234375, 16.0537109375, 16.7421875, 17.4306640625, 18.119140625, 18.8076171875, 19.49609375, 20.1845703125, 20.873046875, 21.5615234375, 22.25]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 7.0, 11.0, 16.0, 15.0, 19.0, 15.0, 26.0, 36.0, 29.0, 37.0, 64.0, 74.0, 115.0, 162.0, 179.0, 273.0, 333.0, 507.0, 695.0, 1203.0, 3562.0, 25908.0, 854425.0, 146867.0, 8834.0, 1937.0, 983.0, 576.0, 404.0, 262.0, 235.0, 170.0, 132.0, 102.0, 69.0, 48.0, 56.0, 30.0, 34.0, 26.0, 22.0, 16.0, 9.0, 6.0, 7.0, 8.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-55.875, -54.1162109375, -52.357421875, -50.5986328125, -48.83984375, -47.0810546875, -45.322265625, -43.5634765625, -41.8046875, -40.0458984375, -38.287109375, -36.5283203125, -34.76953125, -33.0107421875, -31.251953125, -29.4931640625, -27.734375, -25.9755859375, -24.216796875, -22.4580078125, -20.69921875, -18.9404296875, -17.181640625, -15.4228515625, -13.6640625, -11.9052734375, -10.146484375, -8.3876953125, -6.62890625, -4.8701171875, -3.111328125, -1.3525390625, 0.40625, 2.1650390625, 3.923828125, 5.6826171875, 7.44140625, 9.2001953125, 10.958984375, 12.7177734375, 14.4765625, 16.2353515625, 17.994140625, 19.7529296875, 21.51171875, 23.2705078125, 25.029296875, 26.7880859375, 28.546875, 30.3056640625, 32.064453125, 33.8232421875, 35.58203125, 37.3408203125, 39.099609375, 40.8583984375, 42.6171875, 44.3759765625, 46.134765625, 47.8935546875, 49.65234375, 51.4111328125, 53.169921875, 54.9287109375, 56.6875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 6.0, 1.0, 8.0, 7.0, 3.0, 9.0, 12.0, 14.0, 17.0, 13.0, 17.0, 19.0, 19.0, 20.0, 23.0, 30.0, 28.0, 37.0, 32.0, 45.0, 61.0, 71.0, 187.0, 1770.0, 123.0, 72.0, 47.0, 30.0, 42.0, 37.0, 32.0, 23.0, 23.0, 29.0, 21.0, 12.0, 28.0, 17.0, 11.0, 15.0, 2.0, 9.0, 4.0, 9.0, 5.0, 4.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-62.46875, -60.5380859375, -58.607421875, -56.6767578125, -54.74609375, -52.8154296875, -50.884765625, -48.9541015625, -47.0234375, -45.0927734375, -43.162109375, -41.2314453125, -39.30078125, -37.3701171875, -35.439453125, -33.5087890625, -31.578125, -29.6474609375, -27.716796875, -25.7861328125, -23.85546875, -21.9248046875, -19.994140625, -18.0634765625, -16.1328125, -14.2021484375, -12.271484375, -10.3408203125, -8.41015625, -6.4794921875, -4.548828125, -2.6181640625, -0.6875, 1.2431640625, 3.173828125, 5.1044921875, 7.03515625, 8.9658203125, 10.896484375, 12.8271484375, 14.7578125, 16.6884765625, 18.619140625, 20.5498046875, 22.48046875, 24.4111328125, 26.341796875, 28.2724609375, 30.203125, 32.1337890625, 34.064453125, 35.9951171875, 37.92578125, 39.8564453125, 41.787109375, 43.7177734375, 45.6484375, 47.5791015625, 49.509765625, 51.4404296875, 53.37109375, 55.3017578125, 57.232421875, 59.1630859375, 61.09375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 4.0, 5.0, 4.0, 7.0, 4.0, 7.0, 4.0, 17.0, 9.0, 15.0, 27.0, 17.0, 25.0, 31.0, 24.0, 35.0, 44.0, 59.0, 86.0, 124.0, 256.0, 691.0, 9122.0, 3114356.0, 18958.0, 918.0, 273.0, 148.0, 81.0, 80.0, 46.0, 37.0, 26.0, 23.0, 23.0, 15.0, 20.0, 11.0, 15.0, 13.0, 10.0, 9.0, 5.0, 5.0, 9.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-172.0, -166.552734375, -161.10546875, -155.658203125, -150.2109375, -144.763671875, -139.31640625, -133.869140625, -128.421875, -122.974609375, -117.52734375, -112.080078125, -106.6328125, -101.185546875, -95.73828125, -90.291015625, -84.84375, -79.396484375, -73.94921875, -68.501953125, -63.0546875, -57.607421875, -52.16015625, -46.712890625, -41.265625, -35.818359375, -30.37109375, -24.923828125, -19.4765625, -14.029296875, -8.58203125, -3.134765625, 2.3125, 7.759765625, 13.20703125, 18.654296875, 24.1015625, 29.548828125, 34.99609375, 40.443359375, 45.890625, 51.337890625, 56.78515625, 62.232421875, 67.6796875, 73.126953125, 78.57421875, 84.021484375, 89.46875, 94.916015625, 100.36328125, 105.810546875, 111.2578125, 116.705078125, 122.15234375, 127.599609375, 133.046875, 138.494140625, 143.94140625, 149.388671875, 154.8359375, 160.283203125, 165.73046875, 171.177734375, 176.625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 6.0, 4.0, 12.0, 16.0, 52.0, 54.0, 102.0, 135.0, 186.0, 162.0, 102.0, 87.0, 51.0, 21.0, 11.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.716815948486328, -22.757423400878906, -20.79802894592285, -18.83863639831543, -16.879241943359375, -14.919849395751953, -12.960456848144531, -11.001063346862793, -9.041669845581055, -7.082276344299316, -5.122883319854736, -3.1634902954101562, -1.204096794128418, 0.7552967071533203, 2.714689254760742, 4.6740827560424805, 6.633476257324219, 8.592869758605957, 10.552263259887695, 12.511655807495117, 14.471049308776855, 16.430442810058594, 18.389835357666016, 20.349227905273438, 22.308622360229492, 24.268014907836914, 26.22740936279297, 28.18680191040039, 30.146194458007812, 32.1055908203125, 34.064979553222656, 36.024375915527344, 37.9837646484375, 39.94315719604492, 41.902549743652344, 43.86194610595703, 45.82133865356445, 47.780731201171875, 49.7401237487793, 51.69951629638672, 53.658912658691406, 55.61830520629883, 57.57769775390625, 59.53709411621094, 61.49648666381836, 63.45587921142578, 65.41526794433594, 67.37466430664062, 69.33406066894531, 71.29345703125, 73.25284576416016, 75.21224212646484, 77.171630859375, 79.13102722167969, 81.09042358398438, 83.04981231689453, 85.00920104980469, 86.96859741210938, 88.92798614501953, 90.88738250732422, 92.84677124023438, 94.80616760253906, 96.76556396484375, 98.7249526977539, 100.6843490600586]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 8.0, 8.0, 7.0, 8.0, 12.0, 8.0, 13.0, 16.0, 20.0, 13.0, 22.0, 23.0, 23.0, 24.0, 24.0, 34.0, 26.0, 31.0, 44.0, 35.0, 40.0, 37.0, 50.0, 37.0, 43.0, 30.0, 38.0, 31.0, 33.0, 30.0, 31.0, 33.0, 21.0, 19.0, 15.0, 13.0, 14.0, 12.0, 13.0, 15.0, 10.0, 7.0, 5.0, 6.0, 1.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-149.4180908203125, -144.63487243652344, -139.85165405273438, -135.0684356689453, -130.28521728515625, -125.50199890136719, -120.71878814697266, -115.9355697631836, -111.15235137939453, -106.36913299560547, -101.5859146118164, -96.80269622802734, -92.01948547363281, -87.23626708984375, -82.45304870605469, -77.66983032226562, -72.88661193847656, -68.1033935546875, -63.32017517089844, -58.53696060180664, -53.75374221801758, -48.970523834228516, -44.18730926513672, -39.404090881347656, -34.620872497558594, -29.83765411376953, -25.0544376373291, -20.271221160888672, -15.48800277709961, -10.704784393310547, -5.921567916870117, -1.1383514404296875, 3.6448516845703125, 8.428069114685059, 13.211286544799805, 17.994503021240234, 22.777721405029297, 27.56093978881836, 32.344154357910156, 37.12737274169922, 41.91059112548828, 46.693809509277344, 51.477027893066406, 56.2602424621582, 61.043460845947266, 65.82667541503906, 70.60989379882812, 75.39311218261719, 80.17633056640625, 84.95954895019531, 89.74276733398438, 94.52598571777344, 99.3092041015625, 104.09242248535156, 108.8756332397461, 113.65885162353516, 118.44207000732422, 123.22528839111328, 128.0084991455078, 132.79171752929688, 137.57493591308594, 142.358154296875, 147.14137268066406, 151.92459106445312, 156.7078094482422]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 3.0, 13.0, 11.0, 8.0, 7.0, 6.0, 13.0, 15.0, 17.0, 12.0, 20.0, 32.0, 26.0, 36.0, 20.0, 44.0, 37.0, 38.0, 44.0, 45.0, 53.0, 44.0, 32.0, 31.0, 40.0, 35.0, 22.0, 35.0, 41.0, 24.0, 27.0, 27.0, 13.0, 24.0, 17.0, 14.0, 16.0, 14.0, 11.0, 6.0, 7.0, 6.0, 2.0, 4.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.84375, -21.147705078125, -20.45166015625, -19.755615234375, -19.0595703125, -18.363525390625, -17.66748046875, -16.971435546875, -16.275390625, -15.579345703125, -14.88330078125, -14.187255859375, -13.4912109375, -12.795166015625, -12.09912109375, -11.403076171875, -10.70703125, -10.010986328125, -9.31494140625, -8.618896484375, -7.9228515625, -7.226806640625, -6.53076171875, -5.834716796875, -5.138671875, -4.442626953125, -3.74658203125, -3.050537109375, -2.3544921875, -1.658447265625, -0.96240234375, -0.266357421875, 0.4296875, 1.125732421875, 1.82177734375, 2.517822265625, 3.2138671875, 3.909912109375, 4.60595703125, 5.302001953125, 5.998046875, 6.694091796875, 7.39013671875, 8.086181640625, 8.7822265625, 9.478271484375, 10.17431640625, 10.870361328125, 11.56640625, 12.262451171875, 12.95849609375, 13.654541015625, 14.3505859375, 15.046630859375, 15.74267578125, 16.438720703125, 17.134765625, 17.830810546875, 18.52685546875, 19.222900390625, 19.9189453125, 20.614990234375, 21.31103515625, 22.007080078125, 22.703125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 7.0, 9.0, 9.0, 18.0, 19.0, 21.0, 42.0, 51.0, 68.0, 133.0, 172.0, 232.0, 343.0, 594.0, 864.0, 1496.0, 2600.0, 4738.0, 9773.0, 23279.0, 205995.0, 3148411.0, 726526.0, 41185.0, 13073.0, 6350.0, 3249.0, 1861.0, 1109.0, 685.0, 467.0, 273.0, 190.0, 142.0, 103.0, 52.0, 41.0, 41.0, 19.0, 10.0, 16.0, 5.0, 2.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.5, -55.68603515625, -53.8720703125, -52.05810546875, -50.244140625, -48.43017578125, -46.6162109375, -44.80224609375, -42.98828125, -41.17431640625, -39.3603515625, -37.54638671875, -35.732421875, -33.91845703125, -32.1044921875, -30.29052734375, -28.4765625, -26.66259765625, -24.8486328125, -23.03466796875, -21.220703125, -19.40673828125, -17.5927734375, -15.77880859375, -13.96484375, -12.15087890625, -10.3369140625, -8.52294921875, -6.708984375, -4.89501953125, -3.0810546875, -1.26708984375, 0.546875, 2.36083984375, 4.1748046875, 5.98876953125, 7.802734375, 9.61669921875, 11.4306640625, 13.24462890625, 15.05859375, 16.87255859375, 18.6865234375, 20.50048828125, 22.314453125, 24.12841796875, 25.9423828125, 27.75634765625, 29.5703125, 31.38427734375, 33.1982421875, 35.01220703125, 36.826171875, 38.64013671875, 40.4541015625, 42.26806640625, 44.08203125, 45.89599609375, 47.7099609375, 49.52392578125, 51.337890625, 53.15185546875, 54.9658203125, 56.77978515625, 58.59375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 3.0, 9.0, 1.0, 15.0, 10.0, 19.0, 26.0, 36.0, 52.0, 76.0, 199.0, 559.0, 1366.0, 1024.0, 348.0, 119.0, 63.0, 36.0, 29.0, 30.0, 14.0, 13.0, 10.0, 9.0, 4.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.84375, -48.61474609375, -46.3857421875, -44.15673828125, -41.927734375, -39.69873046875, -37.4697265625, -35.24072265625, -33.01171875, -30.78271484375, -28.5537109375, -26.32470703125, -24.095703125, -21.86669921875, -19.6376953125, -17.40869140625, -15.1796875, -12.95068359375, -10.7216796875, -8.49267578125, -6.263671875, -4.03466796875, -1.8056640625, 0.42333984375, 2.65234375, 4.88134765625, 7.1103515625, 9.33935546875, 11.568359375, 13.79736328125, 16.0263671875, 18.25537109375, 20.484375, 22.71337890625, 24.9423828125, 27.17138671875, 29.400390625, 31.62939453125, 33.8583984375, 36.08740234375, 38.31640625, 40.54541015625, 42.7744140625, 45.00341796875, 47.232421875, 49.46142578125, 51.6904296875, 53.91943359375, 56.1484375, 58.37744140625, 60.6064453125, 62.83544921875, 65.064453125, 67.29345703125, 69.5224609375, 71.75146484375, 73.98046875, 76.20947265625, 78.4384765625, 80.66748046875, 82.896484375, 85.12548828125, 87.3544921875, 89.58349609375, 91.8125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 3.0, 12.0, 15.0, 21.0, 28.0, 65.0, 144.0, 332.0, 1021.0, 3666.0, 18575.0, 249665.0, 3860311.0, 49842.0, 7654.0, 1884.0, 570.0, 239.0, 108.0, 52.0, 32.0, 14.0, 6.0, 11.0, 0.0, 5.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-215.0, -209.787109375, -204.57421875, -199.361328125, -194.1484375, -188.935546875, -183.72265625, -178.509765625, -173.296875, -168.083984375, -162.87109375, -157.658203125, -152.4453125, -147.232421875, -142.01953125, -136.806640625, -131.59375, -126.380859375, -121.16796875, -115.955078125, -110.7421875, -105.529296875, -100.31640625, -95.103515625, -89.890625, -84.677734375, -79.46484375, -74.251953125, -69.0390625, -63.826171875, -58.61328125, -53.400390625, -48.1875, -42.974609375, -37.76171875, -32.548828125, -27.3359375, -22.123046875, -16.91015625, -11.697265625, -6.484375, -1.271484375, 3.94140625, 9.154296875, 14.3671875, 19.580078125, 24.79296875, 30.005859375, 35.21875, 40.431640625, 45.64453125, 50.857421875, 56.0703125, 61.283203125, 66.49609375, 71.708984375, 76.921875, 82.134765625, 87.34765625, 92.560546875, 97.7734375, 102.986328125, 108.19921875, 113.412109375, 118.625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 10.0, 36.0, 77.0, 205.0, 306.0, 219.0, 98.0, 34.0, 13.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-538.3421020507812, -526.2870483398438, -514.23193359375, -502.1768798828125, -490.1217956542969, -478.06671142578125, -466.0116271972656, -453.95654296875, -441.9014892578125, -429.8464050292969, -417.79132080078125, -405.73626708984375, -393.6811828613281, -381.6260986328125, -369.5710144042969, -357.51593017578125, -345.4608459472656, -333.40576171875, -321.3506774902344, -309.29559326171875, -297.24053955078125, -285.1854553222656, -273.13037109375, -261.0752868652344, -249.0202178955078, -236.9651336669922, -224.91006469726562, -212.85498046875, -200.79989624023438, -188.7448272705078, -176.6897430419922, -164.63467407226562, -152.57955932617188, -140.52447509765625, -128.4694061279297, -116.41432189941406, -104.35924530029297, -92.30416870117188, -80.24908447265625, -68.19400787353516, -56.13893127441406, -44.08385467529297, -32.02877426147461, -19.97369384765625, -7.918617248535156, 4.1364593505859375, 16.191543579101562, 28.246620178222656, 40.30169677734375, 52.356773376464844, 64.41184997558594, 76.46693420410156, 88.52201080322266, 100.57708740234375, 112.63217163085938, 124.68724822998047, 136.74232482910156, 148.7974090576172, 160.85247802734375, 172.90756225585938, 184.962646484375, 197.01771545410156, 209.0727996826172, 221.12786865234375, 233.18295288085938]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 2.0, 7.0, 11.0, 4.0, 12.0, 15.0, 7.0, 14.0, 19.0, 24.0, 22.0, 21.0, 29.0, 25.0, 33.0, 33.0, 28.0, 33.0, 36.0, 30.0, 31.0, 31.0, 46.0, 38.0, 43.0, 40.0, 33.0, 32.0, 32.0, 22.0, 28.0, 32.0, 22.0, 26.0, 17.0, 19.0, 19.0, 16.0, 15.0, 9.0, 5.0, 10.0, 5.0, 8.0, 1.0, 2.0, 6.0, 3.0, 3.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-117.55738830566406, -113.88167572021484, -110.2059555053711, -106.53024291992188, -102.85453033447266, -99.17881774902344, -95.50309753417969, -91.82738494873047, -88.15167236328125, -84.47595977783203, -80.80023956298828, -77.12452697753906, -73.44881439208984, -69.77310180664062, -66.09738159179688, -62.421669006347656, -58.745948791503906, -55.07023239135742, -51.3945198059082, -47.71880340576172, -44.0430908203125, -40.367374420166016, -36.69165802001953, -33.01594543457031, -29.340229034423828, -25.664514541625977, -21.988800048828125, -18.31308364868164, -14.637369155883789, -10.961654663085938, -7.285938262939453, -3.6102237701416016, 0.06548309326171875, 3.7411980628967285, 7.416913032531738, 11.092628479003906, 14.768342971801758, 18.44405746459961, 22.119773864746094, 25.795488357543945, 29.471202850341797, 33.14691925048828, 36.8226318359375, 40.498348236083984, 44.17406463623047, 47.84977722167969, 51.52549362182617, 55.201210021972656, 58.876922607421875, 62.55263900756836, 66.22835540771484, 69.90406799316406, 73.57978057861328, 77.2554931640625, 80.93121337890625, 84.60692596435547, 88.28263854980469, 91.9583511352539, 95.63407135009766, 99.30978393554688, 102.9854965209961, 106.66120910644531, 110.33692932128906, 114.01264190673828, 117.68836212158203]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 6.0, 5.0, 3.0, 2.0, 8.0, 11.0, 12.0, 11.0, 12.0, 14.0, 26.0, 13.0, 18.0, 24.0, 26.0, 25.0, 26.0, 32.0, 38.0, 35.0, 42.0, 36.0, 38.0, 40.0, 44.0, 31.0, 41.0, 37.0, 23.0, 37.0, 34.0, 22.0, 25.0, 27.0, 31.0, 13.0, 21.0, 15.0, 20.0, 18.0, 15.0, 5.0, 10.0, 7.0, 6.0, 5.0, 0.0, 6.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.609375, -20.928466796875, -20.24755859375, -19.566650390625, -18.8857421875, -18.204833984375, -17.52392578125, -16.843017578125, -16.162109375, -15.481201171875, -14.80029296875, -14.119384765625, -13.4384765625, -12.757568359375, -12.07666015625, -11.395751953125, -10.71484375, -10.033935546875, -9.35302734375, -8.672119140625, -7.9912109375, -7.310302734375, -6.62939453125, -5.948486328125, -5.267578125, -4.586669921875, -3.90576171875, -3.224853515625, -2.5439453125, -1.863037109375, -1.18212890625, -0.501220703125, 0.1796875, 0.860595703125, 1.54150390625, 2.222412109375, 2.9033203125, 3.584228515625, 4.26513671875, 4.946044921875, 5.626953125, 6.307861328125, 6.98876953125, 7.669677734375, 8.3505859375, 9.031494140625, 9.71240234375, 10.393310546875, 11.07421875, 11.755126953125, 12.43603515625, 13.116943359375, 13.7978515625, 14.478759765625, 15.15966796875, 15.840576171875, 16.521484375, 17.202392578125, 17.88330078125, 18.564208984375, 19.2451171875, 19.926025390625, 20.60693359375, 21.287841796875, 21.96875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 6.0, 4.0, 10.0, 12.0, 12.0, 19.0, 28.0, 46.0, 73.0, 100.0, 140.0, 201.0, 242.0, 341.0, 533.0, 733.0, 1039.0, 1635.0, 2261.0, 3344.0, 4849.0, 7037.0, 10367.0, 15751.0, 24017.0, 38428.0, 62795.0, 112233.0, 214204.0, 237270.0, 122731.0, 68723.0, 41361.0, 26263.0, 16614.0, 11040.0, 7640.0, 5115.0, 3574.0, 2371.0, 1634.0, 1097.0, 798.0, 570.0, 381.0, 275.0, 203.0, 126.0, 95.0, 70.0, 44.0, 37.0, 32.0, 19.0, 11.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.8740234375, -1.8117218017578125, -1.749420166015625, -1.6871185302734375, -1.62481689453125, -1.5625152587890625, -1.500213623046875, -1.4379119873046875, -1.3756103515625, -1.3133087158203125, -1.251007080078125, -1.1887054443359375, -1.12640380859375, -1.0641021728515625, -1.001800537109375, -0.9394989013671875, -0.877197265625, -0.8148956298828125, -0.752593994140625, -0.6902923583984375, -0.62799072265625, -0.5656890869140625, -0.503387451171875, -0.4410858154296875, -0.3787841796875, -0.3164825439453125, -0.254180908203125, -0.1918792724609375, -0.12957763671875, -0.0672760009765625, -0.004974365234375, 0.0573272705078125, 0.11962890625, 0.1819305419921875, 0.244232177734375, 0.3065338134765625, 0.36883544921875, 0.4311370849609375, 0.493438720703125, 0.5557403564453125, 0.6180419921875, 0.6803436279296875, 0.742645263671875, 0.8049468994140625, 0.86724853515625, 0.9295501708984375, 0.991851806640625, 1.0541534423828125, 1.116455078125, 1.1787567138671875, 1.241058349609375, 1.3033599853515625, 1.36566162109375, 1.4279632568359375, 1.490264892578125, 1.5525665283203125, 1.6148681640625, 1.6771697998046875, 1.739471435546875, 1.8017730712890625, 1.86407470703125, 1.9263763427734375, 1.988677978515625, 2.0509796142578125, 2.11328125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 7.0, 13.0, 9.0, 11.0, 16.0, 24.0, 22.0, 25.0, 30.0, 21.0, 31.0, 25.0, 41.0, 43.0, 28.0, 39.0, 27.0, 25.0, 43.0, 1061.0, 49.0, 38.0, 37.0, 37.0, 35.0, 34.0, 31.0, 35.0, 30.0, 20.0, 22.0, 13.0, 21.0, 14.0, 14.0, 9.0, 12.0, 9.0, 7.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-16.1875, -15.713623046875, -15.23974609375, -14.765869140625, -14.2919921875, -13.818115234375, -13.34423828125, -12.870361328125, -12.396484375, -11.922607421875, -11.44873046875, -10.974853515625, -10.5009765625, -10.027099609375, -9.55322265625, -9.079345703125, -8.60546875, -8.131591796875, -7.65771484375, -7.183837890625, -6.7099609375, -6.236083984375, -5.76220703125, -5.288330078125, -4.814453125, -4.340576171875, -3.86669921875, -3.392822265625, -2.9189453125, -2.445068359375, -1.97119140625, -1.497314453125, -1.0234375, -0.549560546875, -0.07568359375, 0.398193359375, 0.8720703125, 1.345947265625, 1.81982421875, 2.293701171875, 2.767578125, 3.241455078125, 3.71533203125, 4.189208984375, 4.6630859375, 5.136962890625, 5.61083984375, 6.084716796875, 6.55859375, 7.032470703125, 7.50634765625, 7.980224609375, 8.4541015625, 8.927978515625, 9.40185546875, 9.875732421875, 10.349609375, 10.823486328125, 11.29736328125, 11.771240234375, 12.2451171875, 12.718994140625, 13.19287109375, 13.666748046875, 14.140625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 14.0, 16.0, 25.0, 22.0, 39.0, 64.0, 98.0, 155.0, 194.0, 327.0, 560.0, 809.0, 1344.0, 2230.0, 3684.0, 6058.0, 10399.0, 17742.0, 31057.0, 55302.0, 103406.0, 226381.0, 1339675.0, 136208.0, 69478.0, 38280.0, 21819.0, 12684.0, 7494.0, 4469.0, 2697.0, 1589.0, 1025.0, 626.0, 372.0, 266.0, 164.0, 121.0, 76.0, 45.0, 37.0, 24.0, 17.0, 8.0, 12.0, 4.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.263671875, -2.188690185546875, -2.11370849609375, -2.038726806640625, -1.9637451171875, -1.888763427734375, -1.81378173828125, -1.738800048828125, -1.663818359375, -1.588836669921875, -1.51385498046875, -1.438873291015625, -1.3638916015625, -1.288909912109375, -1.21392822265625, -1.138946533203125, -1.06396484375, -0.988983154296875, -0.91400146484375, -0.839019775390625, -0.7640380859375, -0.689056396484375, -0.61407470703125, -0.539093017578125, -0.464111328125, -0.389129638671875, -0.31414794921875, -0.239166259765625, -0.1641845703125, -0.089202880859375, -0.01422119140625, 0.060760498046875, 0.1357421875, 0.210723876953125, 0.28570556640625, 0.360687255859375, 0.4356689453125, 0.510650634765625, 0.58563232421875, 0.660614013671875, 0.735595703125, 0.810577392578125, 0.88555908203125, 0.960540771484375, 1.0355224609375, 1.110504150390625, 1.18548583984375, 1.260467529296875, 1.33544921875, 1.410430908203125, 1.48541259765625, 1.560394287109375, 1.6353759765625, 1.710357666015625, 1.78533935546875, 1.860321044921875, 1.935302734375, 2.010284423828125, 2.08526611328125, 2.160247802734375, 2.2352294921875, 2.310211181640625, 2.38519287109375, 2.460174560546875, 2.53515625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 6.0, 5.0, 8.0, 0.0, 13.0, 13.0, 11.0, 15.0, 18.0, 24.0, 16.0, 31.0, 17.0, 32.0, 33.0, 41.0, 41.0, 48.0, 57.0, 51.0, 56.0, 35.0, 51.0, 55.0, 39.0, 47.0, 29.0, 37.0, 18.0, 23.0, 24.0, 10.0, 20.0, 15.0, 9.0, 9.0, 9.0, 7.0, 6.0, 7.0, 6.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004322052001953125, -0.004184305667877197, -0.0040465593338012695, -0.003908812999725342, -0.003771066665649414, -0.0036333203315734863, -0.0034955739974975586, -0.003357827663421631, -0.003220081329345703, -0.0030823349952697754, -0.0029445886611938477, -0.00280684232711792, -0.002669095993041992, -0.0025313496589660645, -0.0023936033248901367, -0.002255856990814209, -0.0021181106567382812, -0.0019803643226623535, -0.0018426179885864258, -0.001704871654510498, -0.0015671253204345703, -0.0014293789863586426, -0.0012916326522827148, -0.0011538863182067871, -0.0010161399841308594, -0.0008783936500549316, -0.0007406473159790039, -0.0006029009819030762, -0.00046515464782714844, -0.0003274083137512207, -0.00018966197967529297, -5.1915645599365234e-05, 8.58306884765625e-05, 0.00022357702255249023, 0.00036132335662841797, 0.0004990696907043457, 0.0006368160247802734, 0.0007745623588562012, 0.0009123086929321289, 0.0010500550270080566, 0.0011878013610839844, 0.0013255476951599121, 0.0014632940292358398, 0.0016010403633117676, 0.0017387866973876953, 0.001876533031463623, 0.0020142793655395508, 0.0021520256996154785, 0.0022897720336914062, 0.002427518367767334, 0.0025652647018432617, 0.0027030110359191895, 0.002840757369995117, 0.002978503704071045, 0.0031162500381469727, 0.0032539963722229004, 0.003391742706298828, 0.003529489040374756, 0.0036672353744506836, 0.0038049817085266113, 0.003942728042602539, 0.004080474376678467, 0.0042182207107543945, 0.004355967044830322, 0.00449371337890625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 4.0, 4.0, 0.0, 9.0, 10.0, 17.0, 10.0, 17.0, 17.0, 25.0, 30.0, 41.0, 45.0, 42.0, 60.0, 81.0, 126.0, 152.0, 278.0, 401.0, 840.0, 10289.0, 943138.0, 89694.0, 1596.0, 467.0, 331.0, 181.0, 133.0, 111.0, 64.0, 63.0, 58.0, 27.0, 32.0, 27.0, 23.0, 28.0, 11.0, 18.0, 7.0, 12.0, 11.0, 6.0, 8.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0], "bins": [-0.08740234375, -0.0848093032836914, -0.08221626281738281, -0.07962322235107422, -0.07703018188476562, -0.07443714141845703, -0.07184410095214844, -0.06925106048583984, -0.06665802001953125, -0.06406497955322266, -0.06147193908691406, -0.05887889862060547, -0.056285858154296875, -0.05369281768798828, -0.05109977722167969, -0.048506736755371094, -0.0459136962890625, -0.043320655822753906, -0.04072761535644531, -0.03813457489013672, -0.035541534423828125, -0.03294849395751953, -0.030355453491210938, -0.027762413024902344, -0.02516937255859375, -0.022576332092285156, -0.019983291625976562, -0.01739025115966797, -0.014797210693359375, -0.012204170227050781, -0.009611129760742188, -0.007018089294433594, -0.004425048828125, -0.0018320083618164062, 0.0007610321044921875, 0.0033540725708007812, 0.005947113037109375, 0.008540153503417969, 0.011133193969726562, 0.013726234436035156, 0.01631927490234375, 0.018912315368652344, 0.021505355834960938, 0.02409839630126953, 0.026691436767578125, 0.02928447723388672, 0.03187751770019531, 0.034470558166503906, 0.0370635986328125, 0.039656639099121094, 0.04224967956542969, 0.04484272003173828, 0.047435760498046875, 0.05002880096435547, 0.05262184143066406, 0.055214881896972656, 0.05780792236328125, 0.060400962829589844, 0.06299400329589844, 0.06558704376220703, 0.06818008422851562, 0.07077312469482422, 0.07336616516113281, 0.0759592056274414, 0.07855224609375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 17.0, 42.0, 107.0, 226.0, 270.0, 200.0, 87.0, 38.0, 12.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030136879067867994, -0.0027706336695700884, -0.002527579665184021, -0.00228452542796731, -0.002041471190750599, -0.0017984170699492097, -0.0015553629491478205, -0.0013123087119311094, -0.0010692545911297202, -0.0008262004121206701, -0.00058314623311162, -0.00034009211231023073, -9.70379333011806e-05, 0.00014601624570786953, 0.00038907036650925875, 0.0006321246037259698, 0.000875178724527359, 0.0011182328453287482, 0.0013612870825454593, 0.0016043412033468485, 0.0018473954405635595, 0.002090449444949627, 0.002333503682166338, 0.002576557919383049, 0.00281961215659976, 0.003062666393816471, 0.0033057203982025385, 0.0035487746354192495, 0.0037918288726359606, 0.004034882877022028, 0.004277937114238739, 0.00452099135145545, 0.004764045123010874, 0.005007099360227585, 0.005250153597444296, 0.005493207834661007, 0.005736261606216431, 0.005979315843433142, 0.006222370080649853, 0.006465424317866564, 0.006708478555083275, 0.006951532792299986, 0.007194587029516697, 0.007437640801072121, 0.007680695038288832, 0.007923749275505543, 0.008166803047060966, 0.008409857749938965, 0.008652911521494389, 0.008895965293049812, 0.00913901999592781, 0.009382073767483234, 0.009625128470361233, 0.009868182241916656, 0.010111236944794655, 0.010354290716350079, 0.010597345419228077, 0.0108403991907835, 0.011083453893661499, 0.011326507665216923, 0.011569562368094921, 0.011812616139650345, 0.012055670842528343, 0.012298724614083767, 0.01254177838563919]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 4.0, 5.0, 4.0, 8.0, 10.0, 14.0, 14.0, 16.0, 18.0, 11.0, 25.0, 19.0, 18.0, 32.0, 29.0, 24.0, 25.0, 30.0, 33.0, 30.0, 36.0, 41.0, 46.0, 30.0, 38.0, 25.0, 40.0, 34.0, 31.0, 23.0, 32.0, 33.0, 23.0, 26.0, 23.0, 16.0, 23.0, 25.0, 12.0, 11.0, 13.0, 13.0, 9.0, 8.0, 6.0, 4.0, 3.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0023661255836486816, -0.002292144112288952, -0.002218162640929222, -0.0021441811695694923, -0.0020701996982097626, -0.001996218226850033, -0.001922236755490303, -0.0018482552841305733, -0.0017742738127708435, -0.0017002923414111137, -0.001626310870051384, -0.0015523293986916542, -0.0014783479273319244, -0.0014043664559721947, -0.001330384984612465, -0.0012564035132527351, -0.0011824220418930054, -0.0011084405705332756, -0.0010344590991735458, -0.0009604776278138161, -0.0008864961564540863, -0.0008125146850943565, -0.0007385332137346268, -0.000664551742374897, -0.0005905702710151672, -0.0005165887996554375, -0.0004426073282957077, -0.00036862585693597794, -0.00029464438557624817, -0.0002206629142165184, -0.00014668144285678864, -7.269997149705887e-05, 1.2814998626708984e-06, 7.526297122240067e-05, 0.00014924444258213043, 0.0002232259139418602, 0.00029720738530158997, 0.00037118885666131973, 0.0004451703280210495, 0.0005191517993807793, 0.000593133270740509, 0.0006671147421002388, 0.0007410962134599686, 0.0008150776848196983, 0.0008890591561794281, 0.0009630406275391579, 0.0010370220988988876, 0.0011110035702586174, 0.0011849850416183472, 0.001258966512978077, 0.0013329479843378067, 0.0014069294556975365, 0.0014809109270572662, 0.001554892398416996, 0.0016288738697767258, 0.0017028553411364555, 0.0017768368124961853, 0.001850818283855915, 0.0019247997552156448, 0.0019987812265753746, 0.0020727626979351044, 0.002146744169294834, 0.002220725640654564, 0.0022947071120142937, 0.0023686885833740234]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 4.0, 6.0, 5.0, 3.0, 2.0, 8.0, 11.0, 12.0, 11.0, 12.0, 14.0, 26.0, 13.0, 18.0, 24.0, 26.0, 25.0, 26.0, 32.0, 38.0, 35.0, 42.0, 36.0, 38.0, 40.0, 44.0, 31.0, 41.0, 37.0, 23.0, 37.0, 34.0, 22.0, 25.0, 27.0, 31.0, 13.0, 21.0, 15.0, 20.0, 18.0, 15.0, 5.0, 10.0, 7.0, 6.0, 5.0, 0.0, 6.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.609375, -20.928466796875, -20.24755859375, -19.566650390625, -18.8857421875, -18.204833984375, -17.52392578125, -16.843017578125, -16.162109375, -15.481201171875, -14.80029296875, -14.119384765625, -13.4384765625, -12.757568359375, -12.07666015625, -11.395751953125, -10.71484375, -10.033935546875, -9.35302734375, -8.672119140625, -7.9912109375, -7.310302734375, -6.62939453125, -5.948486328125, -5.267578125, -4.586669921875, -3.90576171875, -3.224853515625, -2.5439453125, -1.863037109375, -1.18212890625, -0.501220703125, 0.1796875, 0.860595703125, 1.54150390625, 2.222412109375, 2.9033203125, 3.584228515625, 4.26513671875, 4.946044921875, 5.626953125, 6.307861328125, 6.98876953125, 7.669677734375, 8.3505859375, 9.031494140625, 9.71240234375, 10.393310546875, 11.07421875, 11.755126953125, 12.43603515625, 13.116943359375, 13.7978515625, 14.478759765625, 15.15966796875, 15.840576171875, 16.521484375, 17.202392578125, 17.88330078125, 18.564208984375, 19.2451171875, 19.926025390625, 20.60693359375, 21.287841796875, 21.96875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 8.0, 0.0, 11.0, 18.0, 11.0, 20.0, 11.0, 21.0, 41.0, 43.0, 55.0, 60.0, 86.0, 123.0, 170.0, 200.0, 341.0, 538.0, 866.0, 1496.0, 2831.0, 5969.0, 15045.0, 58115.0, 543761.0, 351033.0, 43665.0, 12516.0, 5066.0, 2554.0, 1407.0, 749.0, 504.0, 329.0, 249.0, 177.0, 110.0, 94.0, 68.0, 48.0, 42.0, 29.0, 17.0, 19.0, 13.0, 8.0, 6.0, 3.0, 8.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.78125, -32.72265625, -31.6640625, -30.60546875, -29.546875, -28.48828125, -27.4296875, -26.37109375, -25.3125, -24.25390625, -23.1953125, -22.13671875, -21.078125, -20.01953125, -18.9609375, -17.90234375, -16.84375, -15.78515625, -14.7265625, -13.66796875, -12.609375, -11.55078125, -10.4921875, -9.43359375, -8.375, -7.31640625, -6.2578125, -5.19921875, -4.140625, -3.08203125, -2.0234375, -0.96484375, 0.09375, 1.15234375, 2.2109375, 3.26953125, 4.328125, 5.38671875, 6.4453125, 7.50390625, 8.5625, 9.62109375, 10.6796875, 11.73828125, 12.796875, 13.85546875, 14.9140625, 15.97265625, 17.03125, 18.08984375, 19.1484375, 20.20703125, 21.265625, 22.32421875, 23.3828125, 24.44140625, 25.5, 26.55859375, 27.6171875, 28.67578125, 29.734375, 30.79296875, 31.8515625, 32.91015625, 33.96875]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 5.0, 4.0, 10.0, 5.0, 4.0, 15.0, 14.0, 15.0, 7.0, 18.0, 28.0, 23.0, 27.0, 43.0, 40.0, 37.0, 59.0, 51.0, 71.0, 108.0, 213.0, 1659.0, 133.0, 77.0, 57.0, 48.0, 43.0, 33.0, 28.0, 19.0, 31.0, 19.0, 19.0, 24.0, 14.0, 9.0, 7.0, 5.0, 9.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-69.3125, -67.40283203125, -65.4931640625, -63.58349609375, -61.673828125, -59.76416015625, -57.8544921875, -55.94482421875, -54.03515625, -52.12548828125, -50.2158203125, -48.30615234375, -46.396484375, -44.48681640625, -42.5771484375, -40.66748046875, -38.7578125, -36.84814453125, -34.9384765625, -33.02880859375, -31.119140625, -29.20947265625, -27.2998046875, -25.39013671875, -23.48046875, -21.57080078125, -19.6611328125, -17.75146484375, -15.841796875, -13.93212890625, -12.0224609375, -10.11279296875, -8.203125, -6.29345703125, -4.3837890625, -2.47412109375, -0.564453125, 1.34521484375, 3.2548828125, 5.16455078125, 7.07421875, 8.98388671875, 10.8935546875, 12.80322265625, 14.712890625, 16.62255859375, 18.5322265625, 20.44189453125, 22.3515625, 24.26123046875, 26.1708984375, 28.08056640625, 29.990234375, 31.89990234375, 33.8095703125, 35.71923828125, 37.62890625, 39.53857421875, 41.4482421875, 43.35791015625, 45.267578125, 47.17724609375, 49.0869140625, 50.99658203125, 52.90625]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 6.0, 12.0, 22.0, 31.0, 37.0, 49.0, 79.0, 134.0, 192.0, 340.0, 1066.0, 5566.0, 147666.0, 2969745.0, 17394.0, 2053.0, 554.0, 257.0, 160.0, 97.0, 60.0, 49.0, 44.0, 27.0, 21.0, 11.0, 6.0, 3.0, 6.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-128.375, -124.7314453125, -121.087890625, -117.4443359375, -113.80078125, -110.1572265625, -106.513671875, -102.8701171875, -99.2265625, -95.5830078125, -91.939453125, -88.2958984375, -84.65234375, -81.0087890625, -77.365234375, -73.7216796875, -70.078125, -66.4345703125, -62.791015625, -59.1474609375, -55.50390625, -51.8603515625, -48.216796875, -44.5732421875, -40.9296875, -37.2861328125, -33.642578125, -29.9990234375, -26.35546875, -22.7119140625, -19.068359375, -15.4248046875, -11.78125, -8.1376953125, -4.494140625, -0.8505859375, 2.79296875, 6.4365234375, 10.080078125, 13.7236328125, 17.3671875, 21.0107421875, 24.654296875, 28.2978515625, 31.94140625, 35.5849609375, 39.228515625, 42.8720703125, 46.515625, 50.1591796875, 53.802734375, 57.4462890625, 61.08984375, 64.7333984375, 68.376953125, 72.0205078125, 75.6640625, 79.3076171875, 82.951171875, 86.5947265625, 90.23828125, 93.8818359375, 97.525390625, 101.1689453125, 104.8125]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 36.0, 484.0, 463.0, 30.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.65215301513672, -77.00796508789062, -67.36376953125, -57.719581604003906, -48.07539367675781, -38.43120574951172, -28.78701400756836, -19.142822265625, -9.498634338378906, 0.1455554962158203, 9.789745330810547, 19.433935165405273, 29.078125, 38.722312927246094, 48.36650466918945, 58.01069641113281, 67.6548843383789, 77.299072265625, 86.94326782226562, 96.58745574951172, 106.23164367675781, 115.8758316040039, 125.52001953125, 135.16421508789062, 144.80841064453125, 154.45260620117188, 164.09678649902344, 173.74098205566406, 183.38516235351562, 193.02935791015625, 202.67355346679688, 212.3177490234375, 221.9619140625, 231.60610961914062, 241.2502899169922, 250.8944854736328, 260.5386657714844, 270.182861328125, 279.8270568847656, 289.47125244140625, 299.11541748046875, 308.7596130371094, 318.40380859375, 328.0479736328125, 337.6921691894531, 347.33636474609375, 356.9805603027344, 366.624755859375, 376.2689514160156, 385.91314697265625, 395.5573425292969, 405.2015075683594, 414.845703125, 424.4898986816406, 434.13409423828125, 443.7782897949219, 453.4224853515625, 463.0666809082031, 472.71087646484375, 482.35504150390625, 491.9992370605469, 501.6434326171875, 511.2876281738281, 520.9318237304688, 530.5759887695312]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 6.0, 3.0, 7.0, 6.0, 12.0, 14.0, 7.0, 11.0, 17.0, 15.0, 23.0, 20.0, 20.0, 25.0, 23.0, 20.0, 28.0, 33.0, 29.0, 44.0, 40.0, 39.0, 46.0, 41.0, 43.0, 32.0, 46.0, 36.0, 25.0, 33.0, 34.0, 21.0, 22.0, 10.0, 26.0, 16.0, 21.0, 24.0, 14.0, 14.0, 11.0, 9.0, 5.0, 7.0, 5.0, 1.0, 3.0, 2.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0], "bins": [-116.685302734375, -112.95306396484375, -109.22083282470703, -105.48859405517578, -101.75636291503906, -98.02412414550781, -94.29188537597656, -90.55964660644531, -86.8274154663086, -83.09517669677734, -79.36294555664062, -75.63070678710938, -71.89846801757812, -68.1662368774414, -64.43399810791016, -60.70176315307617, -56.96952819824219, -53.2372932434082, -49.50505828857422, -45.77281951904297, -42.040584564208984, -38.308349609375, -34.57611083984375, -30.843875885009766, -27.11164093017578, -23.379405975341797, -19.64716911315918, -15.914933204650879, -12.182697296142578, -8.450462341308594, -4.718225479125977, -0.9859886169433594, 2.746246337890625, 6.478482246398926, 10.210718154907227, 13.942954063415527, 17.675189971923828, 21.407424926757812, 25.13966178894043, 28.871898651123047, 32.60413360595703, 36.336368560791016, 40.068603515625, 43.80084228515625, 47.533077239990234, 51.26531219482422, 54.99755096435547, 58.72978591918945, 62.46202087402344, 66.19425964355469, 69.9264907836914, 73.65872955322266, 77.39096069335938, 81.12319946289062, 84.85543823242188, 88.58767700195312, 92.31990814208984, 96.0521469116211, 99.78437805175781, 103.51661682128906, 107.24885559082031, 110.98108673095703, 114.71332550048828, 118.445556640625, 122.17779541015625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 6.0, 5.0, 8.0, 6.0, 10.0, 10.0, 15.0, 12.0, 17.0, 25.0, 19.0, 29.0, 27.0, 24.0, 27.0, 23.0, 29.0, 31.0, 39.0, 46.0, 46.0, 34.0, 43.0, 36.0, 33.0, 32.0, 37.0, 26.0, 31.0, 33.0, 23.0, 27.0, 27.0, 13.0, 25.0, 21.0, 22.0, 11.0, 14.0, 9.0, 9.0, 9.0, 5.0, 2.0, 4.0, 5.0, 3.0, 4.0, 0.0, 0.0, 3.0, 0.0, 2.0], "bins": [-22.3125, -21.6357421875, -20.958984375, -20.2822265625, -19.60546875, -18.9287109375, -18.251953125, -17.5751953125, -16.8984375, -16.2216796875, -15.544921875, -14.8681640625, -14.19140625, -13.5146484375, -12.837890625, -12.1611328125, -11.484375, -10.8076171875, -10.130859375, -9.4541015625, -8.77734375, -8.1005859375, -7.423828125, -6.7470703125, -6.0703125, -5.3935546875, -4.716796875, -4.0400390625, -3.36328125, -2.6865234375, -2.009765625, -1.3330078125, -0.65625, 0.0205078125, 0.697265625, 1.3740234375, 2.05078125, 2.7275390625, 3.404296875, 4.0810546875, 4.7578125, 5.4345703125, 6.111328125, 6.7880859375, 7.46484375, 8.1416015625, 8.818359375, 9.4951171875, 10.171875, 10.8486328125, 11.525390625, 12.2021484375, 12.87890625, 13.5556640625, 14.232421875, 14.9091796875, 15.5859375, 16.2626953125, 16.939453125, 17.6162109375, 18.29296875, 18.9697265625, 19.646484375, 20.3232421875, 21.0]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 7.0, 9.0, 9.0, 8.0, 19.0, 19.0, 27.0, 42.0, 56.0, 69.0, 106.0, 144.0, 217.0, 348.0, 532.0, 778.0, 1369.0, 2267.0, 4451.0, 9416.0, 25007.0, 295633.0, 3290107.0, 506893.0, 34097.0, 11180.0, 4983.0, 2622.0, 1431.0, 820.0, 558.0, 347.0, 216.0, 141.0, 106.0, 73.0, 54.0, 31.0, 21.0, 15.0, 13.0, 7.0, 18.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-64.25, -62.3369140625, -60.423828125, -58.5107421875, -56.59765625, -54.6845703125, -52.771484375, -50.8583984375, -48.9453125, -47.0322265625, -45.119140625, -43.2060546875, -41.29296875, -39.3798828125, -37.466796875, -35.5537109375, -33.640625, -31.7275390625, -29.814453125, -27.9013671875, -25.98828125, -24.0751953125, -22.162109375, -20.2490234375, -18.3359375, -16.4228515625, -14.509765625, -12.5966796875, -10.68359375, -8.7705078125, -6.857421875, -4.9443359375, -3.03125, -1.1181640625, 0.794921875, 2.7080078125, 4.62109375, 6.5341796875, 8.447265625, 10.3603515625, 12.2734375, 14.1865234375, 16.099609375, 18.0126953125, 19.92578125, 21.8388671875, 23.751953125, 25.6650390625, 27.578125, 29.4912109375, 31.404296875, 33.3173828125, 35.23046875, 37.1435546875, 39.056640625, 40.9697265625, 42.8828125, 44.7958984375, 46.708984375, 48.6220703125, 50.53515625, 52.4482421875, 54.361328125, 56.2744140625, 58.1875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 6.0, 3.0, 7.0, 2.0, 8.0, 12.0, 9.0, 14.0, 19.0, 28.0, 38.0, 47.0, 82.0, 126.0, 237.0, 488.0, 805.0, 901.0, 532.0, 283.0, 142.0, 69.0, 50.0, 40.0, 33.0, 15.0, 18.0, 11.0, 10.0, 14.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.0625, -39.69970703125, -38.3369140625, -36.97412109375, -35.611328125, -34.24853515625, -32.8857421875, -31.52294921875, -30.16015625, -28.79736328125, -27.4345703125, -26.07177734375, -24.708984375, -23.34619140625, -21.9833984375, -20.62060546875, -19.2578125, -17.89501953125, -16.5322265625, -15.16943359375, -13.806640625, -12.44384765625, -11.0810546875, -9.71826171875, -8.35546875, -6.99267578125, -5.6298828125, -4.26708984375, -2.904296875, -1.54150390625, -0.1787109375, 1.18408203125, 2.546875, 3.90966796875, 5.2724609375, 6.63525390625, 7.998046875, 9.36083984375, 10.7236328125, 12.08642578125, 13.44921875, 14.81201171875, 16.1748046875, 17.53759765625, 18.900390625, 20.26318359375, 21.6259765625, 22.98876953125, 24.3515625, 25.71435546875, 27.0771484375, 28.43994140625, 29.802734375, 31.16552734375, 32.5283203125, 33.89111328125, 35.25390625, 36.61669921875, 37.9794921875, 39.34228515625, 40.705078125, 42.06787109375, 43.4306640625, 44.79345703125, 46.15625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 9.0, 4.0, 15.0, 14.0, 18.0, 21.0, 39.0, 50.0, 80.0, 113.0, 194.0, 265.0, 461.0, 684.0, 1116.0, 1894.0, 3244.0, 6032.0, 11691.0, 25724.0, 74978.0, 531550.0, 3204877.0, 238279.0, 51883.0, 19698.0, 9387.0, 4883.0, 2715.0, 1559.0, 1027.0, 642.0, 384.0, 260.0, 154.0, 98.0, 70.0, 54.0, 33.0, 23.0, 16.0, 18.0, 9.0, 8.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-54.65625, -53.06494140625, -51.4736328125, -49.88232421875, -48.291015625, -46.69970703125, -45.1083984375, -43.51708984375, -41.92578125, -40.33447265625, -38.7431640625, -37.15185546875, -35.560546875, -33.96923828125, -32.3779296875, -30.78662109375, -29.1953125, -27.60400390625, -26.0126953125, -24.42138671875, -22.830078125, -21.23876953125, -19.6474609375, -18.05615234375, -16.46484375, -14.87353515625, -13.2822265625, -11.69091796875, -10.099609375, -8.50830078125, -6.9169921875, -5.32568359375, -3.734375, -2.14306640625, -0.5517578125, 1.03955078125, 2.630859375, 4.22216796875, 5.8134765625, 7.40478515625, 8.99609375, 10.58740234375, 12.1787109375, 13.77001953125, 15.361328125, 16.95263671875, 18.5439453125, 20.13525390625, 21.7265625, 23.31787109375, 24.9091796875, 26.50048828125, 28.091796875, 29.68310546875, 31.2744140625, 32.86572265625, 34.45703125, 36.04833984375, 37.6396484375, 39.23095703125, 40.822265625, 42.41357421875, 44.0048828125, 45.59619140625, 47.1875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [5.0, 4.0, 5.0, 23.0, 47.0, 136.0, 277.0, 316.0, 139.0, 43.0, 19.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.50608825683594, -63.90240478515625, -53.2987174987793, -42.695030212402344, -32.091346740722656, -21.48766326904297, -10.883975982666016, -0.2802886962890625, 10.323394775390625, 20.927080154418945, 31.530765533447266, 42.13445281982422, 52.738136291503906, 63.341819763183594, 73.94551086425781, 84.5491943359375, 95.15287780761719, 105.75656127929688, 116.36024475097656, 126.96393585205078, 137.567626953125, 148.17129516601562, 158.77499389648438, 169.37867736816406, 179.98236083984375, 190.58604431152344, 201.18972778320312, 211.7934112548828, 222.3970947265625, 233.00079345703125, 243.60447692871094, 254.20816040039062, 264.81182861328125, 275.41552734375, 286.0191955566406, 296.6228942871094, 307.2265625, 317.83026123046875, 328.4339294433594, 339.0376281738281, 349.64129638671875, 360.2449951171875, 370.8486633300781, 381.4523620605469, 392.0560302734375, 402.65972900390625, 413.2633972167969, 423.8670959472656, 434.4707946777344, 445.0744934082031, 455.67816162109375, 466.2818603515625, 476.8855285644531, 487.4892272949219, 498.0928955078125, 508.69659423828125, 519.30029296875, 529.9039916992188, 540.5076904296875, 551.111328125, 561.7150268554688, 572.3187255859375, 582.9224243164062, 593.526123046875, 604.1297607421875]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 0.0, 11.0, 5.0, 5.0, 9.0, 6.0, 13.0, 8.0, 10.0, 12.0, 27.0, 13.0, 29.0, 21.0, 23.0, 26.0, 29.0, 46.0, 33.0, 39.0, 37.0, 32.0, 33.0, 39.0, 41.0, 40.0, 32.0, 41.0, 43.0, 34.0, 45.0, 35.0, 27.0, 30.0, 22.0, 13.0, 17.0, 12.0, 7.0, 10.0, 11.0, 8.0, 5.0, 6.0, 8.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 3.0], "bins": [-108.5338134765625, -105.25873565673828, -101.98365783691406, -98.70858001708984, -95.43350219726562, -92.1584243774414, -88.88334655761719, -85.6082763671875, -82.33319091796875, -79.05811309814453, -75.78303527832031, -72.5079574584961, -69.23287963867188, -65.95780181884766, -62.6827278137207, -59.407649993896484, -56.13257598876953, -52.85749816894531, -49.582420349121094, -46.307342529296875, -43.032264709472656, -39.75718688964844, -36.482112884521484, -33.207035064697266, -29.931957244873047, -26.656879425048828, -23.38180160522461, -20.106725692749023, -16.831647872924805, -13.556570053100586, -10.281494140625, -7.006416320800781, -3.7313385009765625, -0.45626115798950195, 2.8188161849975586, 6.093893051147461, 9.36897087097168, 12.644048690795898, 15.919124603271484, 19.194202423095703, 22.469280242919922, 25.74435806274414, 29.01943588256836, 32.29450988769531, 35.56958770751953, 38.84466552734375, 42.11974334716797, 45.39482116699219, 48.669898986816406, 51.944976806640625, 55.220054626464844, 58.49513244628906, 61.77021026611328, 65.0452880859375, 68.32035827636719, 71.59544372558594, 74.87051391601562, 78.14559173583984, 81.42066955566406, 84.69574737548828, 87.9708251953125, 91.24590301513672, 94.52098083496094, 97.79605102539062, 101.07113647460938]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 11.0, 11.0, 9.0, 10.0, 16.0, 25.0, 29.0, 14.0, 39.0, 38.0, 35.0, 23.0, 28.0, 33.0, 32.0, 42.0, 29.0, 37.0, 35.0, 41.0, 38.0, 41.0, 39.0, 28.0, 41.0, 25.0, 28.0, 35.0, 27.0, 24.0, 14.0, 19.0, 12.0, 16.0, 16.0, 5.0, 12.0, 9.0, 3.0, 2.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.09375, -22.355712890625, -21.61767578125, -20.879638671875, -20.1416015625, -19.403564453125, -18.66552734375, -17.927490234375, -17.189453125, -16.451416015625, -15.71337890625, -14.975341796875, -14.2373046875, -13.499267578125, -12.76123046875, -12.023193359375, -11.28515625, -10.547119140625, -9.80908203125, -9.071044921875, -8.3330078125, -7.594970703125, -6.85693359375, -6.118896484375, -5.380859375, -4.642822265625, -3.90478515625, -3.166748046875, -2.4287109375, -1.690673828125, -0.95263671875, -0.214599609375, 0.5234375, 1.261474609375, 1.99951171875, 2.737548828125, 3.4755859375, 4.213623046875, 4.95166015625, 5.689697265625, 6.427734375, 7.165771484375, 7.90380859375, 8.641845703125, 9.3798828125, 10.117919921875, 10.85595703125, 11.593994140625, 12.33203125, 13.070068359375, 13.80810546875, 14.546142578125, 15.2841796875, 16.022216796875, 16.76025390625, 17.498291015625, 18.236328125, 18.974365234375, 19.71240234375, 20.450439453125, 21.1884765625, 21.926513671875, 22.66455078125, 23.402587890625, 24.140625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 8.0, 5.0, 17.0, 25.0, 45.0, 50.0, 78.0, 128.0, 190.0, 289.0, 485.0, 707.0, 1122.0, 1692.0, 2672.0, 4173.0, 6616.0, 10299.0, 16538.0, 26659.0, 43717.0, 75702.0, 141763.0, 277527.0, 195272.0, 99108.0, 55713.0, 32925.0, 20350.0, 12429.0, 7963.0, 5134.0, 3195.0, 2110.0, 1319.0, 888.0, 597.0, 376.0, 234.0, 148.0, 108.0, 67.0, 32.0, 32.0, 20.0, 14.0, 9.0, 6.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.306640625, -2.23614501953125, -2.1656494140625, -2.09515380859375, -2.024658203125, -1.95416259765625, -1.8836669921875, -1.81317138671875, -1.74267578125, -1.67218017578125, -1.6016845703125, -1.53118896484375, -1.460693359375, -1.39019775390625, -1.3197021484375, -1.24920654296875, -1.1787109375, -1.10821533203125, -1.0377197265625, -0.96722412109375, -0.896728515625, -0.82623291015625, -0.7557373046875, -0.68524169921875, -0.61474609375, -0.54425048828125, -0.4737548828125, -0.40325927734375, -0.332763671875, -0.26226806640625, -0.1917724609375, -0.12127685546875, -0.05078125, 0.01971435546875, 0.0902099609375, 0.16070556640625, 0.231201171875, 0.30169677734375, 0.3721923828125, 0.44268798828125, 0.51318359375, 0.58367919921875, 0.6541748046875, 0.72467041015625, 0.795166015625, 0.86566162109375, 0.9361572265625, 1.00665283203125, 1.0771484375, 1.14764404296875, 1.2181396484375, 1.28863525390625, 1.359130859375, 1.42962646484375, 1.5001220703125, 1.57061767578125, 1.64111328125, 1.71160888671875, 1.7821044921875, 1.85260009765625, 1.923095703125, 1.99359130859375, 2.0640869140625, 2.13458251953125, 2.205078125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 10.0, 9.0, 9.0, 9.0, 13.0, 7.0, 15.0, 18.0, 18.0, 31.0, 41.0, 34.0, 41.0, 45.0, 40.0, 28.0, 62.0, 48.0, 1072.0, 45.0, 35.0, 44.0, 47.0, 44.0, 42.0, 30.0, 25.0, 18.0, 27.0, 14.0, 19.0, 22.0, 21.0, 14.0, 8.0, 10.0, 8.0, 3.0, 7.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-20.59375, -20.0361328125, -19.478515625, -18.9208984375, -18.36328125, -17.8056640625, -17.248046875, -16.6904296875, -16.1328125, -15.5751953125, -15.017578125, -14.4599609375, -13.90234375, -13.3447265625, -12.787109375, -12.2294921875, -11.671875, -11.1142578125, -10.556640625, -9.9990234375, -9.44140625, -8.8837890625, -8.326171875, -7.7685546875, -7.2109375, -6.6533203125, -6.095703125, -5.5380859375, -4.98046875, -4.4228515625, -3.865234375, -3.3076171875, -2.75, -2.1923828125, -1.634765625, -1.0771484375, -0.51953125, 0.0380859375, 0.595703125, 1.1533203125, 1.7109375, 2.2685546875, 2.826171875, 3.3837890625, 3.94140625, 4.4990234375, 5.056640625, 5.6142578125, 6.171875, 6.7294921875, 7.287109375, 7.8447265625, 8.40234375, 8.9599609375, 9.517578125, 10.0751953125, 10.6328125, 11.1904296875, 11.748046875, 12.3056640625, 12.86328125, 13.4208984375, 13.978515625, 14.5361328125, 15.09375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 8.0, 4.0, 6.0, 8.0, 10.0, 17.0, 33.0, 40.0, 69.0, 98.0, 144.0, 230.0, 370.0, 683.0, 1011.0, 1714.0, 3311.0, 5767.0, 10412.0, 19320.0, 38299.0, 78067.0, 184806.0, 1415555.0, 179667.0, 77141.0, 37570.0, 19193.0, 10311.0, 5553.0, 3269.0, 1798.0, 1055.0, 585.0, 370.0, 229.0, 134.0, 104.0, 66.0, 37.0, 27.0, 16.0, 13.0, 8.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.76171875, -2.668060302734375, -2.57440185546875, -2.480743408203125, -2.3870849609375, -2.293426513671875, -2.19976806640625, -2.106109619140625, -2.012451171875, -1.918792724609375, -1.82513427734375, -1.731475830078125, -1.6378173828125, -1.544158935546875, -1.45050048828125, -1.356842041015625, -1.26318359375, -1.169525146484375, -1.07586669921875, -0.982208251953125, -0.8885498046875, -0.794891357421875, -0.70123291015625, -0.607574462890625, -0.513916015625, -0.420257568359375, -0.32659912109375, -0.232940673828125, -0.1392822265625, -0.045623779296875, 0.04803466796875, 0.141693115234375, 0.2353515625, 0.329010009765625, 0.42266845703125, 0.516326904296875, 0.6099853515625, 0.703643798828125, 0.79730224609375, 0.890960693359375, 0.984619140625, 1.078277587890625, 1.17193603515625, 1.265594482421875, 1.3592529296875, 1.452911376953125, 1.54656982421875, 1.640228271484375, 1.73388671875, 1.827545166015625, 1.92120361328125, 2.014862060546875, 2.1085205078125, 2.202178955078125, 2.29583740234375, 2.389495849609375, 2.483154296875, 2.576812744140625, 2.67047119140625, 2.764129638671875, 2.8577880859375, 2.951446533203125, 3.04510498046875, 3.138763427734375, 3.232421875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 4.0, 2.0, 3.0, 7.0, 5.0, 11.0, 10.0, 13.0, 15.0, 18.0, 26.0, 18.0, 32.0, 36.0, 49.0, 39.0, 50.0, 47.0, 50.0, 51.0, 47.0, 48.0, 44.0, 57.0, 37.0, 48.0, 34.0, 39.0, 22.0, 24.0, 29.0, 11.0, 12.0, 8.0, 7.0, 8.0, 9.0, 2.0, 9.0, 3.0, 2.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.004955291748046875, -0.004797220230102539, -0.004639148712158203, -0.004481077194213867, -0.004323005676269531, -0.004164934158325195, -0.004006862640380859, -0.0038487911224365234, -0.0036907196044921875, -0.0035326480865478516, -0.0033745765686035156, -0.0032165050506591797, -0.0030584335327148438, -0.002900362014770508, -0.002742290496826172, -0.002584218978881836, -0.0024261474609375, -0.002268075942993164, -0.002110004425048828, -0.0019519329071044922, -0.0017938613891601562, -0.0016357898712158203, -0.0014777183532714844, -0.0013196468353271484, -0.0011615753173828125, -0.0010035037994384766, -0.0008454322814941406, -0.0006873607635498047, -0.0005292892456054688, -0.0003712177276611328, -0.00021314620971679688, -5.507469177246094e-05, 0.000102996826171875, 0.00026106834411621094, 0.0004191398620605469, 0.0005772113800048828, 0.0007352828979492188, 0.0008933544158935547, 0.0010514259338378906, 0.0012094974517822266, 0.0013675689697265625, 0.0015256404876708984, 0.0016837120056152344, 0.0018417835235595703, 0.0019998550415039062, 0.002157926559448242, 0.002315998077392578, 0.002474069595336914, 0.00263214111328125, 0.002790212631225586, 0.002948284149169922, 0.003106355667114258, 0.0032644271850585938, 0.0034224987030029297, 0.0035805702209472656, 0.0037386417388916016, 0.0038967132568359375, 0.0040547847747802734, 0.004212856292724609, 0.004370927810668945, 0.004528999328613281, 0.004687070846557617, 0.004845142364501953, 0.005003213882446289, 0.005161285400390625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 1.0, 2.0, 2.0, 5.0, 5.0, 5.0, 4.0, 11.0, 15.0, 12.0, 15.0, 11.0, 16.0, 23.0, 26.0, 53.0, 53.0, 72.0, 91.0, 123.0, 194.0, 255.0, 476.0, 1353.0, 84057.0, 952771.0, 6886.0, 767.0, 368.0, 214.0, 154.0, 111.0, 86.0, 66.0, 50.0, 37.0, 36.0, 36.0, 15.0, 17.0, 14.0, 6.0, 6.0, 4.0, 4.0, 4.0, 6.0, 7.0, 6.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.10198974609375, -0.09892463684082031, -0.09585952758789062, -0.09279441833496094, -0.08972930908203125, -0.08666419982910156, -0.08359909057617188, -0.08053398132324219, -0.0774688720703125, -0.07440376281738281, -0.07133865356445312, -0.06827354431152344, -0.06520843505859375, -0.06214332580566406, -0.059078216552734375, -0.05601310729980469, -0.052947998046875, -0.04988288879394531, -0.046817779541015625, -0.04375267028808594, -0.04068756103515625, -0.03762245178222656, -0.034557342529296875, -0.03149223327636719, -0.0284271240234375, -0.025362014770507812, -0.022296905517578125, -0.019231796264648438, -0.01616668701171875, -0.013101577758789062, -0.010036468505859375, -0.0069713592529296875, -0.00390625, -0.0008411407470703125, 0.002223968505859375, 0.0052890777587890625, 0.00835418701171875, 0.011419296264648438, 0.014484405517578125, 0.017549514770507812, 0.0206146240234375, 0.023679733276367188, 0.026744842529296875, 0.029809951782226562, 0.03287506103515625, 0.03594017028808594, 0.039005279541015625, 0.04207038879394531, 0.045135498046875, 0.04820060729980469, 0.051265716552734375, 0.05433082580566406, 0.05739593505859375, 0.06046104431152344, 0.06352615356445312, 0.06659126281738281, 0.0696563720703125, 0.07272148132324219, 0.07578659057617188, 0.07885169982910156, 0.08191680908203125, 0.08498191833496094, 0.08804702758789062, 0.09111213684082031, 0.09417724609375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 28.0, 107.0, 472.0, 342.0, 60.0, 7.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030196052975952625, -0.0025031291879713535, -0.0019866530783474445, -0.0014701769687235355, -0.0009537008590996265, -0.00043722474947571754, 7.925136014819145e-05, 0.0005957274697721004, 0.0011122035793960094, 0.0016286796890199184, 0.0021451557986438274, 0.0026616319082677364, 0.0031781080178916454, 0.0036945841275155544, 0.004211060237139463, 0.004727536346763372, 0.005244012456387281, 0.00576048856601119, 0.006276964675635099, 0.006793440785259008, 0.007309916894882917, 0.007826393470168114, 0.008342869579792023, 0.008859345689415932, 0.00937582179903984, 0.00989229790866375, 0.010408774018287659, 0.010925250127911568, 0.011441726237535477, 0.011958202347159386, 0.012474678456783295, 0.012991154566407204, 0.013507630676031113, 0.014024106785655022, 0.01454058289527893, 0.01505705900490284, 0.015573535114526749, 0.016090011224150658, 0.016606487333774567, 0.017122963443398476, 0.017639439553022385, 0.018155915662646294, 0.018672391772270203, 0.01918886788189411, 0.01970534399151802, 0.02022182010114193, 0.02073829621076584, 0.021254772320389748, 0.021771248430013657, 0.022287724539637566, 0.022804200649261475, 0.023320676758885384, 0.023837152868509293, 0.0243536289781332, 0.02487010508775711, 0.02538658119738102, 0.02590305730700493, 0.026419533416628838, 0.026936009526252747, 0.027452485635876656, 0.027968961745500565, 0.028485437855124474, 0.029001913964748383, 0.02951839007437229, 0.0300348661839962]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 1.0, 9.0, 3.0, 6.0, 7.0, 10.0, 9.0, 8.0, 14.0, 15.0, 20.0, 20.0, 26.0, 32.0, 26.0, 30.0, 39.0, 34.0, 38.0, 48.0, 39.0, 39.0, 41.0, 48.0, 39.0, 32.0, 40.0, 34.0, 29.0, 28.0, 24.0, 31.0, 28.0, 25.0, 21.0, 23.0, 23.0, 12.0, 10.0, 7.0, 4.0, 9.0, 5.0, 2.0, 8.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.0032747983932495117, -0.003180675208568573, -0.0030865520238876343, -0.0029924288392066956, -0.002898305654525757, -0.002804182469844818, -0.0027100592851638794, -0.0026159361004829407, -0.002521812915802002, -0.0024276897311210632, -0.0023335665464401245, -0.002239443361759186, -0.002145320177078247, -0.0020511969923973083, -0.0019570738077163696, -0.001862950623035431, -0.0017688274383544922, -0.0016747042536735535, -0.0015805810689926147, -0.001486457884311676, -0.0013923346996307373, -0.0012982115149497986, -0.0012040883302688599, -0.0011099651455879211, -0.0010158419609069824, -0.0009217187762260437, -0.000827595591545105, -0.0007334724068641663, -0.0006393492221832275, -0.0005452260375022888, -0.0004511028528213501, -0.0003569796681404114, -0.00026285648345947266, -0.00016873329877853394, -7.461011409759521e-05, 1.9513070583343506e-05, 0.00011363625526428223, 0.00020775943994522095, 0.00030188262462615967, 0.0003960058093070984, 0.0004901289939880371, 0.0005842521786689758, 0.0006783753633499146, 0.0007724985480308533, 0.000866621732711792, 0.0009607449173927307, 0.0010548681020736694, 0.0011489912867546082, 0.0012431144714355469, 0.0013372376561164856, 0.0014313608407974243, 0.001525484025478363, 0.0016196072101593018, 0.0017137303948402405, 0.0018078535795211792, 0.001901976764202118, 0.0019960999488830566, 0.0020902231335639954, 0.002184346318244934, 0.002278469502925873, 0.0023725926876068115, 0.0024667158722877502, 0.002560839056968689, 0.0026549622416496277, 0.0027490854263305664]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 4.0, 7.0, 12.0, 10.0, 9.0, 10.0, 16.0, 25.0, 29.0, 14.0, 39.0, 38.0, 35.0, 23.0, 28.0, 33.0, 32.0, 42.0, 29.0, 37.0, 35.0, 41.0, 38.0, 41.0, 39.0, 28.0, 41.0, 25.0, 28.0, 35.0, 27.0, 24.0, 14.0, 20.0, 11.0, 16.0, 16.0, 5.0, 12.0, 9.0, 3.0, 2.0, 5.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.09375, -22.355712890625, -21.61767578125, -20.879638671875, -20.1416015625, -19.403564453125, -18.66552734375, -17.927490234375, -17.189453125, -16.451416015625, -15.71337890625, -14.975341796875, -14.2373046875, -13.499267578125, -12.76123046875, -12.023193359375, -11.28515625, -10.547119140625, -9.80908203125, -9.071044921875, -8.3330078125, -7.594970703125, -6.85693359375, -6.118896484375, -5.380859375, -4.642822265625, -3.90478515625, -3.166748046875, -2.4287109375, -1.690673828125, -0.95263671875, -0.214599609375, 0.5234375, 1.261474609375, 1.99951171875, 2.737548828125, 3.4755859375, 4.213623046875, 4.95166015625, 5.689697265625, 6.427734375, 7.165771484375, 7.90380859375, 8.641845703125, 9.3798828125, 10.117919921875, 10.85595703125, 11.593994140625, 12.33203125, 13.070068359375, 13.80810546875, 14.546142578125, 15.2841796875, 16.022216796875, 16.76025390625, 17.498291015625, 18.236328125, 18.974365234375, 19.71240234375, 20.450439453125, 21.1884765625, 21.926513671875, 22.66455078125, 23.402587890625, 24.140625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 9.0, 12.0, 17.0, 20.0, 33.0, 55.0, 54.0, 91.0, 108.0, 145.0, 162.0, 273.0, 340.0, 502.0, 638.0, 881.0, 1298.0, 1741.0, 2608.0, 3902.0, 6132.0, 10210.0, 19203.0, 43079.0, 143117.0, 527951.0, 182617.0, 50386.0, 21610.0, 11190.0, 6486.0, 4186.0, 2815.0, 1870.0, 1300.0, 924.0, 627.0, 513.0, 398.0, 278.0, 215.0, 153.0, 107.0, 87.0, 59.0, 44.0, 35.0, 18.0, 11.0, 17.0, 9.0, 7.0, 3.0, 6.0, 1.0, 4.0, 2.0], "bins": [-25.578125, -24.79296875, -24.0078125, -23.22265625, -22.4375, -21.65234375, -20.8671875, -20.08203125, -19.296875, -18.51171875, -17.7265625, -16.94140625, -16.15625, -15.37109375, -14.5859375, -13.80078125, -13.015625, -12.23046875, -11.4453125, -10.66015625, -9.875, -9.08984375, -8.3046875, -7.51953125, -6.734375, -5.94921875, -5.1640625, -4.37890625, -3.59375, -2.80859375, -2.0234375, -1.23828125, -0.453125, 0.33203125, 1.1171875, 1.90234375, 2.6875, 3.47265625, 4.2578125, 5.04296875, 5.828125, 6.61328125, 7.3984375, 8.18359375, 8.96875, 9.75390625, 10.5390625, 11.32421875, 12.109375, 12.89453125, 13.6796875, 14.46484375, 15.25, 16.03515625, 16.8203125, 17.60546875, 18.390625, 19.17578125, 19.9609375, 20.74609375, 21.53125, 22.31640625, 23.1015625, 23.88671875, 24.671875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 3.0, 5.0, 6.0, 11.0, 10.0, 10.0, 7.0, 15.0, 16.0, 13.0, 24.0, 20.0, 33.0, 23.0, 39.0, 34.0, 53.0, 49.0, 67.0, 65.0, 187.0, 1552.0, 274.0, 113.0, 53.0, 51.0, 40.0, 41.0, 33.0, 36.0, 27.0, 15.0, 22.0, 20.0, 5.0, 21.0, 12.0, 13.0, 9.0, 4.0, 4.0, 5.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-60.28125, -58.43798828125, -56.5947265625, -54.75146484375, -52.908203125, -51.06494140625, -49.2216796875, -47.37841796875, -45.53515625, -43.69189453125, -41.8486328125, -40.00537109375, -38.162109375, -36.31884765625, -34.4755859375, -32.63232421875, -30.7890625, -28.94580078125, -27.1025390625, -25.25927734375, -23.416015625, -21.57275390625, -19.7294921875, -17.88623046875, -16.04296875, -14.19970703125, -12.3564453125, -10.51318359375, -8.669921875, -6.82666015625, -4.9833984375, -3.14013671875, -1.296875, 0.54638671875, 2.3896484375, 4.23291015625, 6.076171875, 7.91943359375, 9.7626953125, 11.60595703125, 13.44921875, 15.29248046875, 17.1357421875, 18.97900390625, 20.822265625, 22.66552734375, 24.5087890625, 26.35205078125, 28.1953125, 30.03857421875, 31.8818359375, 33.72509765625, 35.568359375, 37.41162109375, 39.2548828125, 41.09814453125, 42.94140625, 44.78466796875, 46.6279296875, 48.47119140625, 50.314453125, 52.15771484375, 54.0009765625, 55.84423828125, 57.6875]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 12.0, 8.0, 17.0, 27.0, 22.0, 39.0, 44.0, 66.0, 80.0, 136.0, 203.0, 413.0, 1492.0, 11756.0, 1263804.0, 1852710.0, 12100.0, 1624.0, 410.0, 211.0, 149.0, 97.0, 64.0, 48.0, 33.0, 28.0, 20.0, 25.0, 12.0, 11.0, 8.0, 6.0, 4.0, 1.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0], "bins": [-146.5, -142.431640625, -138.36328125, -134.294921875, -130.2265625, -126.158203125, -122.08984375, -118.021484375, -113.953125, -109.884765625, -105.81640625, -101.748046875, -97.6796875, -93.611328125, -89.54296875, -85.474609375, -81.40625, -77.337890625, -73.26953125, -69.201171875, -65.1328125, -61.064453125, -56.99609375, -52.927734375, -48.859375, -44.791015625, -40.72265625, -36.654296875, -32.5859375, -28.517578125, -24.44921875, -20.380859375, -16.3125, -12.244140625, -8.17578125, -4.107421875, -0.0390625, 4.029296875, 8.09765625, 12.166015625, 16.234375, 20.302734375, 24.37109375, 28.439453125, 32.5078125, 36.576171875, 40.64453125, 44.712890625, 48.78125, 52.849609375, 56.91796875, 60.986328125, 65.0546875, 69.123046875, 73.19140625, 77.259765625, 81.328125, 85.396484375, 89.46484375, 93.533203125, 97.6015625, 101.669921875, 105.73828125, 109.806640625, 113.875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 33.0, 823.0, 161.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-976.6517944335938, -954.2985229492188, -931.9451904296875, -909.5919189453125, -887.2385864257812, -864.8853149414062, -842.531982421875, -820.1787109375, -797.825439453125, -775.47216796875, -753.1188354492188, -730.7655639648438, -708.4122314453125, -686.0589599609375, -663.7056884765625, -641.3523559570312, -618.9990234375, -596.645751953125, -574.2924194335938, -551.9391479492188, -529.5858154296875, -507.2325439453125, -484.8792419433594, -462.52593994140625, -440.1726379394531, -417.8193359375, -395.4660339355469, -373.11273193359375, -350.75946044921875, -328.4061279296875, -306.0528564453125, -283.6995544433594, -261.3462829589844, -238.99298095703125, -216.63967895507812, -194.28639221191406, -171.93309020996094, -149.5797882080078, -127.22650146484375, -104.87319946289062, -82.5198974609375, -60.16659927368164, -37.81330108642578, -15.460006713867188, 6.8932952880859375, 29.246597290039062, 51.599884033203125, 73.95318603515625, 96.30648803710938, 118.6597900390625, 141.01309204101562, 163.3663787841797, 185.7196807861328, 208.07298278808594, 230.42626953125, 252.77957153320312, 275.13287353515625, 297.4861755371094, 319.8394775390625, 342.1927490234375, 364.54608154296875, 386.89935302734375, 409.2526550292969, 431.60595703125, 453.9592590332031]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 7.0, 5.0, 8.0, 10.0, 10.0, 16.0, 17.0, 13.0, 12.0, 29.0, 27.0, 29.0, 48.0, 28.0, 29.0, 37.0, 33.0, 34.0, 30.0, 43.0, 48.0, 39.0, 39.0, 38.0, 36.0, 38.0, 26.0, 37.0, 25.0, 31.0, 19.0, 27.0, 19.0, 22.0, 19.0, 14.0, 6.0, 14.0, 6.0, 7.0, 12.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0], "bins": [-137.31695556640625, -133.40562438964844, -129.49429321289062, -125.58296203613281, -121.671630859375, -117.76029968261719, -113.84896850585938, -109.93763732910156, -106.02630615234375, -102.11497497558594, -98.20364379882812, -94.29231262207031, -90.3809814453125, -86.46965026855469, -82.55831909179688, -78.64698791503906, -74.73564910888672, -70.8243179321289, -66.9129867553711, -63.00165557861328, -59.09032440185547, -55.178993225097656, -51.26765823364258, -47.356327056884766, -43.44499588012695, -39.53366470336914, -35.62233352661133, -31.711000442504883, -27.79966926574707, -23.888338088989258, -19.977005004882812, -16.065673828125, -12.154342651367188, -8.243011474609375, -4.331679344177246, -0.4203472137451172, 3.4909839630126953, 7.402315139770508, 11.313648223876953, 15.224979400634766, 19.136310577392578, 23.04764175415039, 26.958972930908203, 30.87030601501465, 34.781639099121094, 38.692970275878906, 42.60430145263672, 46.51563262939453, 50.426963806152344, 54.338294982910156, 58.24962615966797, 62.16095733642578, 66.0722885131836, 69.9836196899414, 73.89495849609375, 77.80628967285156, 81.71762084960938, 85.62895202636719, 89.540283203125, 93.45161437988281, 97.36294555664062, 101.27427673339844, 105.18560791015625, 109.09693908691406, 113.00827026367188]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 4.0, 7.0, 4.0, 13.0, 7.0, 19.0, 14.0, 19.0, 15.0, 23.0, 23.0, 35.0, 28.0, 37.0, 30.0, 46.0, 28.0, 27.0, 34.0, 38.0, 41.0, 45.0, 32.0, 38.0, 29.0, 41.0, 39.0, 41.0, 28.0, 21.0, 32.0, 24.0, 24.0, 20.0, 14.0, 13.0, 15.0, 19.0, 9.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.625, -21.870361328125, -21.11572265625, -20.361083984375, -19.6064453125, -18.851806640625, -18.09716796875, -17.342529296875, -16.587890625, -15.833251953125, -15.07861328125, -14.323974609375, -13.5693359375, -12.814697265625, -12.06005859375, -11.305419921875, -10.55078125, -9.796142578125, -9.04150390625, -8.286865234375, -7.5322265625, -6.777587890625, -6.02294921875, -5.268310546875, -4.513671875, -3.759033203125, -3.00439453125, -2.249755859375, -1.4951171875, -0.740478515625, 0.01416015625, 0.768798828125, 1.5234375, 2.278076171875, 3.03271484375, 3.787353515625, 4.5419921875, 5.296630859375, 6.05126953125, 6.805908203125, 7.560546875, 8.315185546875, 9.06982421875, 9.824462890625, 10.5791015625, 11.333740234375, 12.08837890625, 12.843017578125, 13.59765625, 14.352294921875, 15.10693359375, 15.861572265625, 16.6162109375, 17.370849609375, 18.12548828125, 18.880126953125, 19.634765625, 20.389404296875, 21.14404296875, 21.898681640625, 22.6533203125, 23.407958984375, 24.16259765625, 24.917236328125, 25.671875]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 0.0, 4.0, 5.0, 6.0, 5.0, 11.0, 8.0, 11.0, 20.0, 17.0, 19.0, 30.0, 33.0, 33.0, 48.0, 56.0, 77.0, 105.0, 129.0, 208.0, 290.0, 418.0, 1036.0, 4476.0, 171414.0, 3999284.0, 12866.0, 1808.0, 595.0, 347.0, 215.0, 148.0, 129.0, 98.0, 64.0, 47.0, 33.0, 39.0, 28.0, 22.0, 23.0, 9.0, 13.0, 8.0, 13.0, 8.0, 9.0, 5.0, 3.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0], "bins": [-207.125, -200.701171875, -194.27734375, -187.853515625, -181.4296875, -175.005859375, -168.58203125, -162.158203125, -155.734375, -149.310546875, -142.88671875, -136.462890625, -130.0390625, -123.615234375, -117.19140625, -110.767578125, -104.34375, -97.919921875, -91.49609375, -85.072265625, -78.6484375, -72.224609375, -65.80078125, -59.376953125, -52.953125, -46.529296875, -40.10546875, -33.681640625, -27.2578125, -20.833984375, -14.41015625, -7.986328125, -1.5625, 4.861328125, 11.28515625, 17.708984375, 24.1328125, 30.556640625, 36.98046875, 43.404296875, 49.828125, 56.251953125, 62.67578125, 69.099609375, 75.5234375, 81.947265625, 88.37109375, 94.794921875, 101.21875, 107.642578125, 114.06640625, 120.490234375, 126.9140625, 133.337890625, 139.76171875, 146.185546875, 152.609375, 159.033203125, 165.45703125, 171.880859375, 178.3046875, 184.728515625, 191.15234375, 197.576171875, 204.0]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 7.0, 5.0, 3.0, 8.0, 8.0, 13.0, 18.0, 15.0, 25.0, 33.0, 40.0, 96.0, 165.0, 328.0, 750.0, 1046.0, 662.0, 353.0, 159.0, 101.0, 65.0, 49.0, 35.0, 23.0, 22.0, 10.0, 11.0, 5.0, 4.0, 5.0, 2.0, 1.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.34375, -40.8544921875, -39.365234375, -37.8759765625, -36.38671875, -34.8974609375, -33.408203125, -31.9189453125, -30.4296875, -28.9404296875, -27.451171875, -25.9619140625, -24.47265625, -22.9833984375, -21.494140625, -20.0048828125, -18.515625, -17.0263671875, -15.537109375, -14.0478515625, -12.55859375, -11.0693359375, -9.580078125, -8.0908203125, -6.6015625, -5.1123046875, -3.623046875, -2.1337890625, -0.64453125, 0.8447265625, 2.333984375, 3.8232421875, 5.3125, 6.8017578125, 8.291015625, 9.7802734375, 11.26953125, 12.7587890625, 14.248046875, 15.7373046875, 17.2265625, 18.7158203125, 20.205078125, 21.6943359375, 23.18359375, 24.6728515625, 26.162109375, 27.6513671875, 29.140625, 30.6298828125, 32.119140625, 33.6083984375, 35.09765625, 36.5869140625, 38.076171875, 39.5654296875, 41.0546875, 42.5439453125, 44.033203125, 45.5224609375, 47.01171875, 48.5009765625, 49.990234375, 51.4794921875, 52.96875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 5.0, 5.0, 5.0, 15.0, 19.0, 17.0, 26.0, 36.0, 40.0, 44.0, 67.0, 155.0, 312.0, 807.0, 2198.0, 8347.0, 56817.0, 3766321.0, 332140.0, 20424.0, 4113.0, 1256.0, 503.0, 235.0, 115.0, 64.0, 48.0, 31.0, 24.0, 14.0, 8.0, 18.0, 16.0, 9.0, 3.0, 6.0, 6.0, 5.0, 3.0, 6.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-102.1875, -98.3681640625, -94.548828125, -90.7294921875, -86.91015625, -83.0908203125, -79.271484375, -75.4521484375, -71.6328125, -67.8134765625, -63.994140625, -60.1748046875, -56.35546875, -52.5361328125, -48.716796875, -44.8974609375, -41.078125, -37.2587890625, -33.439453125, -29.6201171875, -25.80078125, -21.9814453125, -18.162109375, -14.3427734375, -10.5234375, -6.7041015625, -2.884765625, 0.9345703125, 4.75390625, 8.5732421875, 12.392578125, 16.2119140625, 20.03125, 23.8505859375, 27.669921875, 31.4892578125, 35.30859375, 39.1279296875, 42.947265625, 46.7666015625, 50.5859375, 54.4052734375, 58.224609375, 62.0439453125, 65.86328125, 69.6826171875, 73.501953125, 77.3212890625, 81.140625, 84.9599609375, 88.779296875, 92.5986328125, 96.41796875, 100.2373046875, 104.056640625, 107.8759765625, 111.6953125, 115.5146484375, 119.333984375, 123.1533203125, 126.97265625, 130.7919921875, 134.611328125, 138.4306640625, 142.25]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 8.0, 38.0, 145.0, 540.0, 212.0, 60.0, 9.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-955.600341796875, -938.401123046875, -921.2019653320312, -904.0027465820312, -886.8035278320312, -869.6043090820312, -852.4051513671875, -835.2059326171875, -818.0067138671875, -800.8074951171875, -783.6083374023438, -766.4091186523438, -749.2098999023438, -732.0106811523438, -714.8115234375, -697.6123046875, -680.4130859375, -663.2138671875, -646.0147094726562, -628.8154907226562, -611.6162719726562, -594.4170532226562, -577.2178955078125, -560.0186767578125, -542.8195190429688, -525.6203002929688, -508.4211120605469, -491.221923828125, -474.022705078125, -456.8235168457031, -439.62432861328125, -422.42510986328125, -405.22589111328125, -388.0267028808594, -370.8274841308594, -353.6282958984375, -336.4290771484375, -319.2298889160156, -302.03070068359375, -284.83148193359375, -267.6322937011719, -250.43309020996094, -233.23388671875, -216.03469848632812, -198.83547973632812, -181.63629150390625, -164.4370880126953, -147.23788452148438, -130.03868103027344, -112.8394775390625, -95.64027404785156, -78.44107818603516, -61.24187469482422, -44.04267120361328, -26.843475341796875, -9.644271850585938, 7.554931640625, 24.754133224487305, 41.95333480834961, 59.15253448486328, 76.35173797607422, 93.55094146728516, 110.75013732910156, 127.9493408203125, 145.14854431152344]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 7.0, 3.0, 8.0, 2.0, 8.0, 6.0, 20.0, 23.0, 17.0, 20.0, 12.0, 20.0, 24.0, 36.0, 29.0, 18.0, 35.0, 25.0, 46.0, 52.0, 40.0, 51.0, 37.0, 54.0, 33.0, 42.0, 44.0, 37.0, 16.0, 35.0, 29.0, 28.0, 19.0, 24.0, 19.0, 10.0, 15.0, 20.0, 10.0, 4.0, 11.0, 9.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.85477447509766, -109.0417251586914, -105.22867584228516, -101.4156265258789, -97.60256958007812, -93.78952026367188, -89.97647094726562, -86.16342163085938, -82.35037231445312, -78.53732299804688, -74.72427368164062, -70.91122436523438, -67.09817504882812, -63.28512191772461, -59.472068786621094, -55.659019470214844, -51.845970153808594, -48.032920837402344, -44.219871520996094, -40.40681838989258, -36.59376907348633, -32.78071975708008, -28.967668533325195, -25.154617309570312, -21.341567993164062, -17.528518676757812, -13.71546745300293, -9.902417182922363, -6.089366912841797, -2.276317596435547, 1.536733627319336, 5.349784851074219, 9.162841796875, 12.975892066955566, 16.788942337036133, 20.601993560791016, 24.415042877197266, 28.228092193603516, 32.04114532470703, 35.85419464111328, 39.66724395751953, 43.48029327392578, 47.29334259033203, 51.10639572143555, 54.9194450378418, 58.73249435424805, 62.54554748535156, 66.35859680175781, 70.17164611816406, 73.98469543457031, 77.79774475097656, 81.61079406738281, 85.42384338378906, 89.23689270019531, 93.0499496459961, 96.86299896240234, 100.6760482788086, 104.48909759521484, 108.3021469116211, 112.11519622802734, 115.92825317382812, 119.74130249023438, 123.55435180664062, 127.36740112304688, 131.18045043945312]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 10.0, 6.0, 12.0, 14.0, 15.0, 16.0, 14.0, 16.0, 22.0, 19.0, 33.0, 16.0, 30.0, 25.0, 34.0, 49.0, 27.0, 46.0, 33.0, 46.0, 46.0, 42.0, 38.0, 41.0, 40.0, 30.0, 35.0, 38.0, 27.0, 30.0, 22.0, 20.0, 15.0, 9.0, 18.0, 22.0, 8.0, 6.0, 4.0, 7.0, 7.0, 2.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-23.609375, -22.83251953125, -22.0556640625, -21.27880859375, -20.501953125, -19.72509765625, -18.9482421875, -18.17138671875, -17.39453125, -16.61767578125, -15.8408203125, -15.06396484375, -14.287109375, -13.51025390625, -12.7333984375, -11.95654296875, -11.1796875, -10.40283203125, -9.6259765625, -8.84912109375, -8.072265625, -7.29541015625, -6.5185546875, -5.74169921875, -4.96484375, -4.18798828125, -3.4111328125, -2.63427734375, -1.857421875, -1.08056640625, -0.3037109375, 0.47314453125, 1.25, 2.02685546875, 2.8037109375, 3.58056640625, 4.357421875, 5.13427734375, 5.9111328125, 6.68798828125, 7.46484375, 8.24169921875, 9.0185546875, 9.79541015625, 10.572265625, 11.34912109375, 12.1259765625, 12.90283203125, 13.6796875, 14.45654296875, 15.2333984375, 16.01025390625, 16.787109375, 17.56396484375, 18.3408203125, 19.11767578125, 19.89453125, 20.67138671875, 21.4482421875, 22.22509765625, 23.001953125, 23.77880859375, 24.5556640625, 25.33251953125, 26.109375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 8.0, 10.0, 7.0, 18.0, 15.0, 27.0, 41.0, 69.0, 103.0, 154.0, 207.0, 296.0, 427.0, 670.0, 980.0, 1528.0, 2260.0, 3552.0, 5327.0, 8741.0, 13845.0, 23045.0, 37683.0, 64852.0, 124476.0, 265234.0, 236167.0, 109858.0, 58350.0, 34519.0, 20746.0, 12822.0, 7855.0, 5017.0, 3223.0, 2191.0, 1407.0, 898.0, 600.0, 418.0, 288.0, 200.0, 123.0, 109.0, 69.0, 30.0, 36.0, 18.0, 12.0, 10.0, 10.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.447265625, -2.370574951171875, -2.29388427734375, -2.217193603515625, -2.1405029296875, -2.063812255859375, -1.98712158203125, -1.910430908203125, -1.833740234375, -1.757049560546875, -1.68035888671875, -1.603668212890625, -1.5269775390625, -1.450286865234375, -1.37359619140625, -1.296905517578125, -1.22021484375, -1.143524169921875, -1.06683349609375, -0.990142822265625, -0.9134521484375, -0.836761474609375, -0.76007080078125, -0.683380126953125, -0.606689453125, -0.529998779296875, -0.45330810546875, -0.376617431640625, -0.2999267578125, -0.223236083984375, -0.14654541015625, -0.069854736328125, 0.0068359375, 0.083526611328125, 0.16021728515625, 0.236907958984375, 0.3135986328125, 0.390289306640625, 0.46697998046875, 0.543670654296875, 0.620361328125, 0.697052001953125, 0.77374267578125, 0.850433349609375, 0.9271240234375, 1.003814697265625, 1.08050537109375, 1.157196044921875, 1.23388671875, 1.310577392578125, 1.38726806640625, 1.463958740234375, 1.5406494140625, 1.617340087890625, 1.69403076171875, 1.770721435546875, 1.847412109375, 1.924102783203125, 2.00079345703125, 2.077484130859375, 2.1541748046875, 2.230865478515625, 2.30755615234375, 2.384246826171875, 2.4609375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 2.0, 5.0, 7.0, 9.0, 6.0, 11.0, 17.0, 23.0, 12.0, 14.0, 15.0, 27.0, 31.0, 27.0, 32.0, 36.0, 27.0, 41.0, 38.0, 44.0, 41.0, 1069.0, 28.0, 41.0, 36.0, 41.0, 37.0, 35.0, 37.0, 34.0, 25.0, 25.0, 25.0, 17.0, 18.0, 16.0, 20.0, 8.0, 5.0, 8.0, 8.0, 13.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.640625, -15.1483154296875, -14.656005859375, -14.1636962890625, -13.67138671875, -13.1790771484375, -12.686767578125, -12.1944580078125, -11.7021484375, -11.2098388671875, -10.717529296875, -10.2252197265625, -9.73291015625, -9.2406005859375, -8.748291015625, -8.2559814453125, -7.763671875, -7.2713623046875, -6.779052734375, -6.2867431640625, -5.79443359375, -5.3021240234375, -4.809814453125, -4.3175048828125, -3.8251953125, -3.3328857421875, -2.840576171875, -2.3482666015625, -1.85595703125, -1.3636474609375, -0.871337890625, -0.3790283203125, 0.11328125, 0.6055908203125, 1.097900390625, 1.5902099609375, 2.08251953125, 2.5748291015625, 3.067138671875, 3.5594482421875, 4.0517578125, 4.5440673828125, 5.036376953125, 5.5286865234375, 6.02099609375, 6.5133056640625, 7.005615234375, 7.4979248046875, 7.990234375, 8.4825439453125, 8.974853515625, 9.4671630859375, 9.95947265625, 10.4517822265625, 10.944091796875, 11.4364013671875, 11.9287109375, 12.4210205078125, 12.913330078125, 13.4056396484375, 13.89794921875, 14.3902587890625, 14.882568359375, 15.3748779296875, 15.8671875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 5.0, 12.0, 19.0, 16.0, 32.0, 49.0, 57.0, 83.0, 144.0, 223.0, 347.0, 507.0, 897.0, 1455.0, 2305.0, 4041.0, 6478.0, 11059.0, 18888.0, 33855.0, 63586.0, 130392.0, 1346746.0, 245081.0, 107422.0, 53756.0, 29091.0, 16397.0, 9550.0, 5700.0, 3504.0, 2087.0, 1213.0, 809.0, 454.0, 295.0, 197.0, 128.0, 76.0, 58.0, 44.0, 28.0, 11.0, 12.0, 11.0, 9.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.765625, -2.681488037109375, -2.59735107421875, -2.513214111328125, -2.4290771484375, -2.344940185546875, -2.26080322265625, -2.176666259765625, -2.092529296875, -2.008392333984375, -1.92425537109375, -1.840118408203125, -1.7559814453125, -1.671844482421875, -1.58770751953125, -1.503570556640625, -1.41943359375, -1.335296630859375, -1.25115966796875, -1.167022705078125, -1.0828857421875, -0.998748779296875, -0.91461181640625, -0.830474853515625, -0.746337890625, -0.662200927734375, -0.57806396484375, -0.493927001953125, -0.4097900390625, -0.325653076171875, -0.24151611328125, -0.157379150390625, -0.0732421875, 0.010894775390625, 0.09503173828125, 0.179168701171875, 0.2633056640625, 0.347442626953125, 0.43157958984375, 0.515716552734375, 0.599853515625, 0.683990478515625, 0.76812744140625, 0.852264404296875, 0.9364013671875, 1.020538330078125, 1.10467529296875, 1.188812255859375, 1.27294921875, 1.357086181640625, 1.44122314453125, 1.525360107421875, 1.6094970703125, 1.693634033203125, 1.77777099609375, 1.861907958984375, 1.946044921875, 2.030181884765625, 2.11431884765625, 2.198455810546875, 2.2825927734375, 2.366729736328125, 2.45086669921875, 2.535003662109375, 2.619140625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 8.0, 3.0, 6.0, 7.0, 7.0, 13.0, 14.0, 20.0, 16.0, 22.0, 22.0, 25.0, 28.0, 34.0, 47.0, 50.0, 52.0, 44.0, 51.0, 50.0, 45.0, 43.0, 47.0, 50.0, 39.0, 34.0, 24.0, 37.0, 18.0, 28.0, 24.0, 20.0, 14.0, 8.0, 7.0, 5.0, 11.0, 5.0, 3.0, 4.0, 6.0, 2.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0], "bins": [-0.004741668701171875, -0.004607468843460083, -0.004473268985748291, -0.004339069128036499, -0.004204869270324707, -0.004070669412612915, -0.003936469554901123, -0.003802269697189331, -0.003668069839477539, -0.003533869981765747, -0.003399670124053955, -0.003265470266342163, -0.003131270408630371, -0.002997070550918579, -0.002862870693206787, -0.002728670835494995, -0.002594470977783203, -0.002460271120071411, -0.002326071262359619, -0.002191871404647827, -0.002057671546936035, -0.0019234716892242432, -0.0017892718315124512, -0.0016550719738006592, -0.0015208721160888672, -0.0013866722583770752, -0.0012524724006652832, -0.0011182725429534912, -0.0009840726852416992, -0.0008498728275299072, -0.0007156729698181152, -0.0005814731121063232, -0.00044727325439453125, -0.00031307339668273926, -0.00017887353897094727, -4.4673681259155273e-05, 8.952617645263672e-05, 0.0002237260341644287, 0.0003579258918762207, 0.0004921257495880127, 0.0006263256072998047, 0.0007605254650115967, 0.0008947253227233887, 0.0010289251804351807, 0.0011631250381469727, 0.0012973248958587646, 0.0014315247535705566, 0.0015657246112823486, 0.0016999244689941406, 0.0018341243267059326, 0.0019683241844177246, 0.0021025240421295166, 0.0022367238998413086, 0.0023709237575531006, 0.0025051236152648926, 0.0026393234729766846, 0.0027735233306884766, 0.0029077231884002686, 0.0030419230461120605, 0.0031761229038238525, 0.0033103227615356445, 0.0034445226192474365, 0.0035787224769592285, 0.0037129223346710205, 0.0038471221923828125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 2.0, 10.0, 4.0, 5.0, 5.0, 8.0, 7.0, 15.0, 15.0, 18.0, 19.0, 25.0, 36.0, 57.0, 49.0, 70.0, 77.0, 105.0, 136.0, 216.0, 310.0, 522.0, 1305.0, 24391.0, 987351.0, 30773.0, 1334.0, 540.0, 343.0, 197.0, 134.0, 89.0, 72.0, 67.0, 44.0, 51.0, 29.0, 27.0, 25.0, 11.0, 11.0, 16.0, 9.0, 5.0, 9.0, 7.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.07550048828125, -0.07302665710449219, -0.07055282592773438, -0.06807899475097656, -0.06560516357421875, -0.06313133239746094, -0.060657501220703125, -0.05818367004394531, -0.0557098388671875, -0.05323600769042969, -0.050762176513671875, -0.04828834533691406, -0.04581451416015625, -0.04334068298339844, -0.040866851806640625, -0.03839302062988281, -0.035919189453125, -0.03344535827636719, -0.030971527099609375, -0.028497695922851562, -0.02602386474609375, -0.023550033569335938, -0.021076202392578125, -0.018602371215820312, -0.0161285400390625, -0.013654708862304688, -0.011180877685546875, -0.008707046508789062, -0.00623321533203125, -0.0037593841552734375, -0.001285552978515625, 0.0011882781982421875, 0.003662109375, 0.0061359405517578125, 0.008609771728515625, 0.011083602905273438, 0.01355743408203125, 0.016031265258789062, 0.018505096435546875, 0.020978927612304688, 0.0234527587890625, 0.025926589965820312, 0.028400421142578125, 0.030874252319335938, 0.03334808349609375, 0.03582191467285156, 0.038295745849609375, 0.04076957702636719, 0.043243408203125, 0.04571723937988281, 0.048191070556640625, 0.05066490173339844, 0.05313873291015625, 0.05561256408691406, 0.058086395263671875, 0.06056022644042969, 0.0630340576171875, 0.06550788879394531, 0.06798171997070312, 0.07045555114746094, 0.07292938232421875, 0.07540321350097656, 0.07787704467773438, 0.08035087585449219, 0.08282470703125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 9.0, 50.0, 411.0, 459.0, 79.0, 10.0], "bins": [-0.03447018191218376, -0.033905837684869766, -0.03334149345755577, -0.032777149230241776, -0.03221280500292778, -0.031648457050323486, -0.03108411468565464, -0.030519770458340645, -0.0299554243683815, -0.029391080141067505, -0.02882673591375351, -0.028262389823794365, -0.02769804559648037, -0.027133701369166374, -0.02656935714185238, -0.026005012914538383, -0.025440668687224388, -0.024876324459910393, -0.024311980232596397, -0.023747634142637253, -0.023183289915323257, -0.022618945688009262, -0.022054601460695267, -0.02149025723338127, -0.020925913006067276, -0.02036156877875328, -0.019797224551439285, -0.01923287846148014, -0.018668534234166145, -0.01810419000685215, -0.017539845779538155, -0.01697550155222416, -0.016411153599619865, -0.01584680937230587, -0.0152824642136693, -0.014718119986355305, -0.014153774827718735, -0.01358943060040474, -0.013025086373090744, -0.012460742145776749, -0.011896397918462753, -0.011332053691148758, -0.010767708532512188, -0.010203364305198193, -0.009639019146561623, -0.009074674919247627, -0.008510330691933632, -0.007945986464619637, -0.007381640840321779, -0.006817296147346497, -0.006252951920032501, -0.0056886072270572186, -0.005124262534081936, -0.004559917841106653, -0.0039955731481313705, -0.003431228920817375, -0.0028668842278420925, -0.00230253953486681, -0.0017381950747221708, -0.00117385049816221, -0.0006095059216022491, -4.5161228626966476e-05, 0.0005191832315176725, 0.0010835276916623116, 0.0016478722682222724]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 2.0, 4.0, 5.0, 7.0, 7.0, 9.0, 10.0, 18.0, 22.0, 14.0, 25.0, 20.0, 25.0, 32.0, 31.0, 34.0, 30.0, 47.0, 39.0, 46.0, 47.0, 43.0, 46.0, 37.0, 35.0, 37.0, 47.0, 25.0, 36.0, 39.0, 36.0, 24.0, 24.0, 26.0, 8.0, 16.0, 12.0, 5.0, 10.0, 6.0, 6.0, 1.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0027129650115966797, -0.0026272041723132133, -0.002541443333029747, -0.0024556824937462807, -0.0023699216544628143, -0.002284160815179348, -0.0021983999758958817, -0.0021126391366124153, -0.002026878297328949, -0.0019411174580454826, -0.0018553566187620163, -0.00176959577947855, -0.0016838349401950836, -0.0015980741009116173, -0.001512313261628151, -0.0014265524223446846, -0.0013407915830612183, -0.001255030743777752, -0.0011692699044942856, -0.0010835090652108192, -0.000997748225927353, -0.0009119873866438866, -0.0008262265473604202, -0.0007404657080769539, -0.0006547048687934875, -0.0005689440295100212, -0.00048318319022655487, -0.00039742235094308853, -0.0003116615116596222, -0.00022590067237615585, -0.00014013983309268951, -5.4378993809223175e-05, 3.1381845474243164e-05, 0.0001171426847577095, 0.00020290352404117584, 0.0002886643633246422, 0.0003744252026081085, 0.00046018604189157486, 0.0005459468811750412, 0.0006317077204585075, 0.0007174685597419739, 0.0008032293990254402, 0.0008889902383089066, 0.0009747510775923729, 0.0010605119168758392, 0.0011462727561593056, 0.001232033595442772, 0.0013177944347262383, 0.0014035552740097046, 0.001489316113293171, 0.0015750769525766373, 0.0016608377918601036, 0.00174659863114357, 0.0018323594704270363, 0.0019181203097105026, 0.002003881148993969, 0.0020896419882774353, 0.0021754028275609016, 0.002261163666844368, 0.0023469245061278343, 0.0024326853454113007, 0.002518446184694767, 0.0026042070239782333, 0.0026899678632616997, 0.002775728702545166]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 10.0, 6.0, 12.0, 14.0, 15.0, 16.0, 14.0, 16.0, 22.0, 19.0, 33.0, 16.0, 30.0, 25.0, 34.0, 49.0, 27.0, 46.0, 33.0, 46.0, 46.0, 42.0, 38.0, 41.0, 40.0, 30.0, 35.0, 38.0, 27.0, 30.0, 22.0, 20.0, 15.0, 9.0, 18.0, 22.0, 8.0, 6.0, 4.0, 7.0, 7.0, 2.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-23.609375, -22.83251953125, -22.0556640625, -21.27880859375, -20.501953125, -19.72509765625, -18.9482421875, -18.17138671875, -17.39453125, -16.61767578125, -15.8408203125, -15.06396484375, -14.287109375, -13.51025390625, -12.7333984375, -11.95654296875, -11.1796875, -10.40283203125, -9.6259765625, -8.84912109375, -8.072265625, -7.29541015625, -6.5185546875, -5.74169921875, -4.96484375, -4.18798828125, -3.4111328125, -2.63427734375, -1.857421875, -1.08056640625, -0.3037109375, 0.47314453125, 1.25, 2.02685546875, 2.8037109375, 3.58056640625, 4.357421875, 5.13427734375, 5.9111328125, 6.68798828125, 7.46484375, 8.24169921875, 9.0185546875, 9.79541015625, 10.572265625, 11.34912109375, 12.1259765625, 12.90283203125, 13.6796875, 14.45654296875, 15.2333984375, 16.01025390625, 16.787109375, 17.56396484375, 18.3408203125, 19.11767578125, 19.89453125, 20.67138671875, 21.4482421875, 22.22509765625, 23.001953125, 23.77880859375, 24.5556640625, 25.33251953125, 26.109375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 2.0, 5.0, 3.0, 10.0, 10.0, 12.0, 19.0, 30.0, 41.0, 51.0, 81.0, 104.0, 134.0, 201.0, 235.0, 336.0, 445.0, 558.0, 761.0, 1017.0, 1384.0, 1933.0, 3234.0, 5620.0, 11589.0, 31051.0, 124471.0, 582503.0, 205500.0, 43544.0, 15193.0, 6690.0, 3675.0, 2159.0, 1546.0, 1096.0, 865.0, 665.0, 462.0, 366.0, 248.0, 178.0, 133.0, 100.0, 86.0, 56.0, 43.0, 38.0, 16.0, 19.0, 13.0, 7.0, 10.0, 4.0, 6.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.125, -35.87255859375, -34.6201171875, -33.36767578125, -32.115234375, -30.86279296875, -29.6103515625, -28.35791015625, -27.10546875, -25.85302734375, -24.6005859375, -23.34814453125, -22.095703125, -20.84326171875, -19.5908203125, -18.33837890625, -17.0859375, -15.83349609375, -14.5810546875, -13.32861328125, -12.076171875, -10.82373046875, -9.5712890625, -8.31884765625, -7.06640625, -5.81396484375, -4.5615234375, -3.30908203125, -2.056640625, -0.80419921875, 0.4482421875, 1.70068359375, 2.953125, 4.20556640625, 5.4580078125, 6.71044921875, 7.962890625, 9.21533203125, 10.4677734375, 11.72021484375, 12.97265625, 14.22509765625, 15.4775390625, 16.72998046875, 17.982421875, 19.23486328125, 20.4873046875, 21.73974609375, 22.9921875, 24.24462890625, 25.4970703125, 26.74951171875, 28.001953125, 29.25439453125, 30.5068359375, 31.75927734375, 33.01171875, 34.26416015625, 35.5166015625, 36.76904296875, 38.021484375, 39.27392578125, 40.5263671875, 41.77880859375, 43.03125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 2.0, 1.0, 4.0, 2.0, 2.0, 6.0, 6.0, 12.0, 4.0, 9.0, 16.0, 20.0, 21.0, 27.0, 27.0, 29.0, 43.0, 38.0, 59.0, 59.0, 87.0, 138.0, 1596.0, 315.0, 105.0, 78.0, 47.0, 43.0, 50.0, 38.0, 31.0, 31.0, 22.0, 22.0, 11.0, 16.0, 10.0, 7.0, 8.0, 4.0, 6.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.6875, -52.57421875, -50.4609375, -48.34765625, -46.234375, -44.12109375, -42.0078125, -39.89453125, -37.78125, -35.66796875, -33.5546875, -31.44140625, -29.328125, -27.21484375, -25.1015625, -22.98828125, -20.875, -18.76171875, -16.6484375, -14.53515625, -12.421875, -10.30859375, -8.1953125, -6.08203125, -3.96875, -1.85546875, 0.2578125, 2.37109375, 4.484375, 6.59765625, 8.7109375, 10.82421875, 12.9375, 15.05078125, 17.1640625, 19.27734375, 21.390625, 23.50390625, 25.6171875, 27.73046875, 29.84375, 31.95703125, 34.0703125, 36.18359375, 38.296875, 40.41015625, 42.5234375, 44.63671875, 46.75, 48.86328125, 50.9765625, 53.08984375, 55.203125, 57.31640625, 59.4296875, 61.54296875, 63.65625, 65.76953125, 67.8828125, 69.99609375, 72.109375, 74.22265625, 76.3359375, 78.44921875, 80.5625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 5.0, 12.0, 10.0, 13.0, 15.0, 16.0, 30.0, 50.0, 58.0, 108.0, 183.0, 391.0, 1195.0, 152328.0, 2988508.0, 1683.0, 502.0, 209.0, 122.0, 77.0, 59.0, 30.0, 27.0, 20.0, 7.0, 13.0, 11.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-333.25, -323.1796875, -313.109375, -303.0390625, -292.96875, -282.8984375, -272.828125, -262.7578125, -252.6875, -242.6171875, -232.546875, -222.4765625, -212.40625, -202.3359375, -192.265625, -182.1953125, -172.125, -162.0546875, -151.984375, -141.9140625, -131.84375, -121.7734375, -111.703125, -101.6328125, -91.5625, -81.4921875, -71.421875, -61.3515625, -51.28125, -41.2109375, -31.140625, -21.0703125, -11.0, -0.9296875, 9.140625, 19.2109375, 29.28125, 39.3515625, 49.421875, 59.4921875, 69.5625, 79.6328125, 89.703125, 99.7734375, 109.84375, 119.9140625, 129.984375, 140.0546875, 150.125, 160.1953125, 170.265625, 180.3359375, 190.40625, 200.4765625, 210.546875, 220.6171875, 230.6875, 240.7578125, 250.828125, 260.8984375, 270.96875, 281.0390625, 291.109375, 301.1796875, 311.25]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 32.0, 365.0, 528.0, 77.0, 10.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.27427673339844, -112.36537170410156, -98.45646667480469, -84.54755401611328, -70.6386489868164, -56.72974395751953, -42.820831298828125, -28.91192626953125, -15.003021240234375, -1.0941143035888672, 12.81479263305664, 26.72370147705078, 40.632606506347656, 54.54151153564453, 68.45042419433594, 82.35932922363281, 96.26823425292969, 110.17713928222656, 124.08604431152344, 137.99496459960938, 151.90386962890625, 165.81277465820312, 179.7216796875, 193.63058471679688, 207.53948974609375, 221.44839477539062, 235.3572998046875, 249.26620483398438, 263.17510986328125, 277.0840148925781, 290.992919921875, 304.90185546875, 318.81072998046875, 332.7196350097656, 346.6285400390625, 360.5374450683594, 374.44635009765625, 388.3552551269531, 402.26416015625, 416.173095703125, 430.08197021484375, 443.9908752441406, 457.8997802734375, 471.8086853027344, 485.71759033203125, 499.6264953613281, 513.535400390625, 527.4443359375, 541.353271484375, 555.26220703125, 569.1710815429688, 583.0800170898438, 596.9888916015625, 610.8978271484375, 624.8067016601562, 638.7156372070312, 652.62451171875, 666.533447265625, 680.4423217773438, 694.3512573242188, 708.2601318359375, 722.1690673828125, 736.0779418945312, 749.9868774414062, 763.895751953125]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 9.0, 5.0, 13.0, 10.0, 16.0, 15.0, 18.0, 23.0, 30.0, 26.0, 28.0, 28.0, 35.0, 35.0, 48.0, 40.0, 40.0, 54.0, 56.0, 40.0, 52.0, 33.0, 34.0, 32.0, 37.0, 31.0, 31.0, 27.0, 23.0, 14.0, 21.0, 14.0, 18.0, 13.0, 10.0, 9.0, 10.0, 5.0, 5.0, 0.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-152.06520080566406, -146.97637939453125, -141.8875732421875, -136.7987518310547, -131.70993041992188, -126.6211166381836, -121.53230285644531, -116.4434814453125, -111.35466766357422, -106.26585388183594, -101.17703247070312, -96.08821868896484, -90.99940490722656, -85.91058349609375, -80.82176971435547, -75.73295593261719, -70.64413452148438, -65.5553207397461, -60.46649932861328, -55.377685546875, -50.28886795043945, -45.200050354003906, -40.111236572265625, -35.02241897583008, -29.93360137939453, -24.844783782958984, -19.75596809387207, -14.66715145111084, -9.57833480834961, -4.4895172119140625, 0.5992984771728516, 5.688114166259766, 10.776947021484375, 15.865763664245605, 20.954580307006836, 26.04339599609375, 31.132213592529297, 36.221031188964844, 41.309844970703125, 46.39866256713867, 51.48748016357422, 56.576297760009766, 61.66511535644531, 66.7539291381836, 71.84274291992188, 76.93156433105469, 82.02037811279297, 87.10919189453125, 92.19801330566406, 97.28682708740234, 102.37564849853516, 107.46446228027344, 112.55328369140625, 117.64209747314453, 122.73091125488281, 127.81973266601562, 132.90853881835938, 137.9973602294922, 143.08616638183594, 148.17498779296875, 153.26380920410156, 158.35263061523438, 163.44143676757812, 168.53025817871094, 173.61907958984375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 2.0, 1.0, 10.0, 9.0, 9.0, 7.0, 8.0, 18.0, 11.0, 10.0, 11.0, 20.0, 28.0, 26.0, 19.0, 33.0, 22.0, 28.0, 27.0, 42.0, 32.0, 39.0, 38.0, 40.0, 42.0, 39.0, 35.0, 53.0, 40.0, 31.0, 26.0, 16.0, 20.0, 23.0, 22.0, 24.0, 22.0, 21.0, 18.0, 11.0, 12.0, 16.0, 10.0, 7.0, 5.0, 5.0, 4.0, 5.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.546875, -18.833251953125, -18.11962890625, -17.406005859375, -16.6923828125, -15.978759765625, -15.26513671875, -14.551513671875, -13.837890625, -13.124267578125, -12.41064453125, -11.697021484375, -10.9833984375, -10.269775390625, -9.55615234375, -8.842529296875, -8.12890625, -7.415283203125, -6.70166015625, -5.988037109375, -5.2744140625, -4.560791015625, -3.84716796875, -3.133544921875, -2.419921875, -1.706298828125, -0.99267578125, -0.279052734375, 0.4345703125, 1.148193359375, 1.86181640625, 2.575439453125, 3.2890625, 4.002685546875, 4.71630859375, 5.429931640625, 6.1435546875, 6.857177734375, 7.57080078125, 8.284423828125, 8.998046875, 9.711669921875, 10.42529296875, 11.138916015625, 11.8525390625, 12.566162109375, 13.27978515625, 13.993408203125, 14.70703125, 15.420654296875, 16.13427734375, 16.847900390625, 17.5615234375, 18.275146484375, 18.98876953125, 19.702392578125, 20.416015625, 21.129638671875, 21.84326171875, 22.556884765625, 23.2705078125, 23.984130859375, 24.69775390625, 25.411376953125, 26.125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 10.0, 4.0, 8.0, 16.0, 19.0, 17.0, 30.0, 52.0, 69.0, 69.0, 165.0, 204.0, 302.0, 411.0, 642.0, 933.0, 1536.0, 2661.0, 5080.0, 11923.0, 50867.0, 371605.0, 2179794.0, 1334869.0, 190191.0, 24571.0, 8266.0, 3994.0, 2118.0, 1311.0, 812.0, 539.0, 389.0, 219.0, 180.0, 112.0, 95.0, 62.0, 43.0, 40.0, 22.0, 8.0, 11.0, 8.0, 2.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-47.25, -45.8935546875, -44.537109375, -43.1806640625, -41.82421875, -40.4677734375, -39.111328125, -37.7548828125, -36.3984375, -35.0419921875, -33.685546875, -32.3291015625, -30.97265625, -29.6162109375, -28.259765625, -26.9033203125, -25.546875, -24.1904296875, -22.833984375, -21.4775390625, -20.12109375, -18.7646484375, -17.408203125, -16.0517578125, -14.6953125, -13.3388671875, -11.982421875, -10.6259765625, -9.26953125, -7.9130859375, -6.556640625, -5.2001953125, -3.84375, -2.4873046875, -1.130859375, 0.2255859375, 1.58203125, 2.9384765625, 4.294921875, 5.6513671875, 7.0078125, 8.3642578125, 9.720703125, 11.0771484375, 12.43359375, 13.7900390625, 15.146484375, 16.5029296875, 17.859375, 19.2158203125, 20.572265625, 21.9287109375, 23.28515625, 24.6416015625, 25.998046875, 27.3544921875, 28.7109375, 30.0673828125, 31.423828125, 32.7802734375, 34.13671875, 35.4931640625, 36.849609375, 38.2060546875, 39.5625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 3.0, 5.0, 8.0, 9.0, 12.0, 13.0, 31.0, 40.0, 45.0, 76.0, 121.0, 200.0, 375.0, 645.0, 925.0, 642.0, 390.0, 186.0, 117.0, 72.0, 51.0, 25.0, 16.0, 23.0, 7.0, 11.0, 7.0, 3.0, 9.0, 4.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.15625, -42.35107421875, -40.5458984375, -38.74072265625, -36.935546875, -35.13037109375, -33.3251953125, -31.52001953125, -29.71484375, -27.90966796875, -26.1044921875, -24.29931640625, -22.494140625, -20.68896484375, -18.8837890625, -17.07861328125, -15.2734375, -13.46826171875, -11.6630859375, -9.85791015625, -8.052734375, -6.24755859375, -4.4423828125, -2.63720703125, -0.83203125, 0.97314453125, 2.7783203125, 4.58349609375, 6.388671875, 8.19384765625, 9.9990234375, 11.80419921875, 13.609375, 15.41455078125, 17.2197265625, 19.02490234375, 20.830078125, 22.63525390625, 24.4404296875, 26.24560546875, 28.05078125, 29.85595703125, 31.6611328125, 33.46630859375, 35.271484375, 37.07666015625, 38.8818359375, 40.68701171875, 42.4921875, 44.29736328125, 46.1025390625, 47.90771484375, 49.712890625, 51.51806640625, 53.3232421875, 55.12841796875, 56.93359375, 58.73876953125, 60.5439453125, 62.34912109375, 64.154296875, 65.95947265625, 67.7646484375, 69.56982421875, 71.375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 4.0, 9.0, 13.0, 21.0, 27.0, 43.0, 53.0, 118.0, 217.0, 477.0, 998.0, 2757.0, 9097.0, 45796.0, 1299275.0, 2758559.0, 60408.0, 10884.0, 3261.0, 1156.0, 488.0, 263.0, 141.0, 81.0, 47.0, 34.0, 17.0, 12.0, 7.0, 2.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-114.5, -111.4921875, -108.484375, -105.4765625, -102.46875, -99.4609375, -96.453125, -93.4453125, -90.4375, -87.4296875, -84.421875, -81.4140625, -78.40625, -75.3984375, -72.390625, -69.3828125, -66.375, -63.3671875, -60.359375, -57.3515625, -54.34375, -51.3359375, -48.328125, -45.3203125, -42.3125, -39.3046875, -36.296875, -33.2890625, -30.28125, -27.2734375, -24.265625, -21.2578125, -18.25, -15.2421875, -12.234375, -9.2265625, -6.21875, -3.2109375, -0.203125, 2.8046875, 5.8125, 8.8203125, 11.828125, 14.8359375, 17.84375, 20.8515625, 23.859375, 26.8671875, 29.875, 32.8828125, 35.890625, 38.8984375, 41.90625, 44.9140625, 47.921875, 50.9296875, 53.9375, 56.9453125, 59.953125, 62.9609375, 65.96875, 68.9765625, 71.984375, 74.9921875, 78.0]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 243.0, 755.0, 18.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2434.56640625, -2376.829833984375, -2319.093505859375, -2261.35693359375, -2203.620361328125, -2145.8837890625, -2088.1474609375, -2030.410888671875, -1972.6744384765625, -1914.93798828125, -1857.201416015625, -1799.4649658203125, -1741.728515625, -1683.991943359375, -1626.2554931640625, -1568.51904296875, -1510.782470703125, -1453.0460205078125, -1395.3094482421875, -1337.572998046875, -1279.83642578125, -1222.0999755859375, -1164.363525390625, -1106.626953125, -1048.8905029296875, -991.1539916992188, -933.41748046875, -875.6810302734375, -817.9445190429688, -760.2080078125, -702.4715576171875, -644.7350463867188, -586.99853515625, -529.2620239257812, -471.5255432128906, -413.7890625, -356.05255126953125, -298.3160400390625, -240.57955932617188, -182.84307861328125, -125.1065673828125, -67.37007141113281, -9.633575439453125, 48.10292053222656, 105.83941650390625, 163.575927734375, 221.31240844726562, 279.04888916015625, 336.785400390625, 394.52191162109375, 452.2583923339844, 509.994873046875, 567.7313842773438, 625.4678955078125, 683.204345703125, 740.9408569335938, 798.6773681640625, 856.4138793945312, 914.150390625, 971.8868408203125, 1029.623291015625, 1087.35986328125, 1145.0963134765625, 1202.832763671875, 1260.5693359375]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 6.0, 7.0, 13.0, 10.0, 11.0, 12.0, 15.0, 17.0, 25.0, 30.0, 28.0, 37.0, 36.0, 27.0, 40.0, 46.0, 49.0, 49.0, 37.0, 45.0, 49.0, 51.0, 46.0, 47.0, 42.0, 42.0, 27.0, 31.0, 24.0, 32.0, 16.0, 18.0, 9.0, 9.0, 6.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-147.3984832763672, -142.49415588378906, -137.58982849121094, -132.68551635742188, -127.78118896484375, -122.87686157226562, -117.9725341796875, -113.06820678710938, -108.16388702392578, -103.25955963134766, -98.35523986816406, -93.45091247558594, -88.54658508300781, -83.64226531982422, -78.7379379272461, -73.8336181640625, -68.92929077148438, -64.02496337890625, -59.120643615722656, -54.21631622314453, -49.31199264526367, -44.40766906738281, -39.50334167480469, -34.59901809692383, -29.69469451904297, -24.79037094116211, -19.886045455932617, -14.981720924377441, -10.077396392822266, -5.173072814941406, -0.26874732971191406, 4.635578155517578, 9.539886474609375, 14.44421100616455, 19.348535537719727, 24.25286102294922, 29.157184600830078, 34.06150817871094, 38.96583557128906, 43.87015914916992, 48.77448272705078, 53.67880630493164, 58.5831298828125, 63.487457275390625, 68.39178466796875, 73.29610443115234, 78.20043182373047, 83.10475158691406, 88.00907897949219, 92.91340637207031, 97.8177261352539, 102.72205352783203, 107.62637329101562, 112.53070068359375, 117.43502807617188, 122.33935546875, 127.2436752319336, 132.1479949951172, 137.0523223876953, 141.95664978027344, 146.86097717285156, 151.76528930664062, 156.66961669921875, 161.57394409179688, 166.478271484375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 3.0, 8.0, 5.0, 5.0, 12.0, 4.0, 7.0, 8.0, 7.0, 20.0, 16.0, 13.0, 19.0, 22.0, 28.0, 31.0, 22.0, 27.0, 29.0, 27.0, 39.0, 35.0, 32.0, 47.0, 39.0, 43.0, 43.0, 35.0, 48.0, 29.0, 37.0, 31.0, 33.0, 25.0, 21.0, 23.0, 22.0, 17.0, 14.0, 14.0, 10.0, 14.0, 5.0, 10.0, 10.0, 2.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.65625, -16.05615234375, -15.4560546875, -14.85595703125, -14.255859375, -13.65576171875, -13.0556640625, -12.45556640625, -11.85546875, -11.25537109375, -10.6552734375, -10.05517578125, -9.455078125, -8.85498046875, -8.2548828125, -7.65478515625, -7.0546875, -6.45458984375, -5.8544921875, -5.25439453125, -4.654296875, -4.05419921875, -3.4541015625, -2.85400390625, -2.25390625, -1.65380859375, -1.0537109375, -0.45361328125, 0.146484375, 0.74658203125, 1.3466796875, 1.94677734375, 2.546875, 3.14697265625, 3.7470703125, 4.34716796875, 4.947265625, 5.54736328125, 6.1474609375, 6.74755859375, 7.34765625, 7.94775390625, 8.5478515625, 9.14794921875, 9.748046875, 10.34814453125, 10.9482421875, 11.54833984375, 12.1484375, 12.74853515625, 13.3486328125, 13.94873046875, 14.548828125, 15.14892578125, 15.7490234375, 16.34912109375, 16.94921875, 17.54931640625, 18.1494140625, 18.74951171875, 19.349609375, 19.94970703125, 20.5498046875, 21.14990234375, 21.75]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 4.0, 7.0, 16.0, 27.0, 25.0, 42.0, 51.0, 77.0, 107.0, 165.0, 245.0, 435.0, 577.0, 831.0, 1260.0, 1894.0, 2729.0, 4209.0, 6249.0, 9558.0, 14857.0, 23105.0, 38696.0, 66369.0, 120035.0, 236799.0, 233038.0, 117979.0, 65183.0, 38167.0, 23316.0, 14303.0, 9448.0, 6241.0, 4077.0, 2762.0, 1807.0, 1212.0, 875.0, 634.0, 382.0, 267.0, 162.0, 98.0, 78.0, 46.0, 37.0, 26.0, 26.0, 6.0, 7.0, 4.0, 5.0, 5.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.7138671875, -1.6547393798828125, -1.595611572265625, -1.5364837646484375, -1.47735595703125, -1.4182281494140625, -1.359100341796875, -1.2999725341796875, -1.2408447265625, -1.1817169189453125, -1.122589111328125, -1.0634613037109375, -1.00433349609375, -0.9452056884765625, -0.886077880859375, -0.8269500732421875, -0.767822265625, -0.7086944580078125, -0.649566650390625, -0.5904388427734375, -0.53131103515625, -0.4721832275390625, -0.413055419921875, -0.3539276123046875, -0.2947998046875, -0.2356719970703125, -0.176544189453125, -0.1174163818359375, -0.05828857421875, 0.0008392333984375, 0.059967041015625, 0.1190948486328125, 0.17822265625, 0.2373504638671875, 0.296478271484375, 0.3556060791015625, 0.41473388671875, 0.4738616943359375, 0.532989501953125, 0.5921173095703125, 0.6512451171875, 0.7103729248046875, 0.769500732421875, 0.8286285400390625, 0.88775634765625, 0.9468841552734375, 1.006011962890625, 1.0651397705078125, 1.124267578125, 1.1833953857421875, 1.242523193359375, 1.3016510009765625, 1.36077880859375, 1.4199066162109375, 1.479034423828125, 1.5381622314453125, 1.5972900390625, 1.6564178466796875, 1.715545654296875, 1.7746734619140625, 1.83380126953125, 1.8929290771484375, 1.952056884765625, 2.0111846923828125, 2.0703125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 3.0, 5.0, 7.0, 7.0, 5.0, 10.0, 9.0, 17.0, 11.0, 19.0, 24.0, 14.0, 26.0, 25.0, 29.0, 34.0, 36.0, 41.0, 40.0, 44.0, 48.0, 31.0, 1058.0, 35.0, 39.0, 37.0, 28.0, 44.0, 37.0, 28.0, 29.0, 29.0, 23.0, 17.0, 18.0, 24.0, 16.0, 13.0, 14.0, 9.0, 11.0, 6.0, 5.0, 5.0, 5.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.4765625, -11.0953369140625, -10.714111328125, -10.3328857421875, -9.95166015625, -9.5704345703125, -9.189208984375, -8.8079833984375, -8.4267578125, -8.0455322265625, -7.664306640625, -7.2830810546875, -6.90185546875, -6.5206298828125, -6.139404296875, -5.7581787109375, -5.376953125, -4.9957275390625, -4.614501953125, -4.2332763671875, -3.85205078125, -3.4708251953125, -3.089599609375, -2.7083740234375, -2.3271484375, -1.9459228515625, -1.564697265625, -1.1834716796875, -0.80224609375, -0.4210205078125, -0.039794921875, 0.3414306640625, 0.72265625, 1.1038818359375, 1.485107421875, 1.8663330078125, 2.24755859375, 2.6287841796875, 3.010009765625, 3.3912353515625, 3.7724609375, 4.1536865234375, 4.534912109375, 4.9161376953125, 5.29736328125, 5.6785888671875, 6.059814453125, 6.4410400390625, 6.822265625, 7.2034912109375, 7.584716796875, 7.9659423828125, 8.34716796875, 8.7283935546875, 9.109619140625, 9.4908447265625, 9.8720703125, 10.2532958984375, 10.634521484375, 11.0157470703125, 11.39697265625, 11.7781982421875, 12.159423828125, 12.5406494140625, 12.921875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 2.0, 4.0, 5.0, 9.0, 9.0, 8.0, 21.0, 21.0, 38.0, 44.0, 66.0, 107.0, 152.0, 243.0, 334.0, 549.0, 853.0, 1289.0, 2236.0, 3667.0, 5778.0, 9813.0, 16856.0, 29351.0, 52945.0, 102857.0, 238073.0, 1350347.0, 131682.0, 64689.0, 35221.0, 19874.0, 11692.0, 7143.0, 4139.0, 2574.0, 1584.0, 1045.0, 639.0, 417.0, 259.0, 168.0, 112.0, 69.0, 48.0, 30.0, 30.0, 21.0, 8.0, 7.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.017578125, -1.95068359375, -1.8837890625, -1.81689453125, -1.75, -1.68310546875, -1.6162109375, -1.54931640625, -1.482421875, -1.41552734375, -1.3486328125, -1.28173828125, -1.21484375, -1.14794921875, -1.0810546875, -1.01416015625, -0.947265625, -0.88037109375, -0.8134765625, -0.74658203125, -0.6796875, -0.61279296875, -0.5458984375, -0.47900390625, -0.412109375, -0.34521484375, -0.2783203125, -0.21142578125, -0.14453125, -0.07763671875, -0.0107421875, 0.05615234375, 0.123046875, 0.18994140625, 0.2568359375, 0.32373046875, 0.390625, 0.45751953125, 0.5244140625, 0.59130859375, 0.658203125, 0.72509765625, 0.7919921875, 0.85888671875, 0.92578125, 0.99267578125, 1.0595703125, 1.12646484375, 1.193359375, 1.26025390625, 1.3271484375, 1.39404296875, 1.4609375, 1.52783203125, 1.5947265625, 1.66162109375, 1.728515625, 1.79541015625, 1.8623046875, 1.92919921875, 1.99609375, 2.06298828125, 2.1298828125, 2.19677734375, 2.263671875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 4.0, 5.0, 6.0, 7.0, 9.0, 12.0, 14.0, 11.0, 13.0, 20.0, 16.0, 23.0, 33.0, 33.0, 24.0, 55.0, 44.0, 47.0, 59.0, 51.0, 45.0, 38.0, 53.0, 43.0, 30.0, 37.0, 29.0, 31.0, 34.0, 26.0, 31.0, 19.0, 15.0, 20.0, 13.0, 7.0, 9.0, 5.0, 6.0, 5.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.003932952880859375, -0.0038109421730041504, -0.0036889314651489258, -0.003566920757293701, -0.0034449100494384766, -0.003322899341583252, -0.0032008886337280273, -0.0030788779258728027, -0.002956867218017578, -0.0028348565101623535, -0.002712845802307129, -0.0025908350944519043, -0.0024688243865966797, -0.002346813678741455, -0.0022248029708862305, -0.002102792263031006, -0.0019807815551757812, -0.0018587708473205566, -0.001736760139465332, -0.0016147494316101074, -0.0014927387237548828, -0.0013707280158996582, -0.0012487173080444336, -0.001126706600189209, -0.0010046958923339844, -0.0008826851844787598, -0.0007606744766235352, -0.0006386637687683105, -0.0005166530609130859, -0.00039464235305786133, -0.0002726316452026367, -0.0001506209373474121, -2.86102294921875e-05, 9.340047836303711e-05, 0.00021541118621826172, 0.00033742189407348633, 0.00045943260192871094, 0.0005814433097839355, 0.0007034540176391602, 0.0008254647254943848, 0.0009474754333496094, 0.001069486141204834, 0.0011914968490600586, 0.0013135075569152832, 0.0014355182647705078, 0.0015575289726257324, 0.001679539680480957, 0.0018015503883361816, 0.0019235610961914062, 0.002045571804046631, 0.0021675825119018555, 0.00228959321975708, 0.0024116039276123047, 0.0025336146354675293, 0.002655625343322754, 0.0027776360511779785, 0.002899646759033203, 0.0030216574668884277, 0.0031436681747436523, 0.003265678882598877, 0.0033876895904541016, 0.003509700298309326, 0.0036317110061645508, 0.0037537217140197754, 0.003875732421875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 2.0, 5.0, 6.0, 7.0, 7.0, 9.0, 11.0, 18.0, 25.0, 25.0, 34.0, 49.0, 53.0, 76.0, 101.0, 118.0, 173.0, 274.0, 412.0, 882.0, 9199.0, 989516.0, 44837.0, 1165.0, 503.0, 333.0, 161.0, 148.0, 88.0, 62.0, 47.0, 38.0, 32.0, 33.0, 22.0, 9.0, 17.0, 13.0, 7.0, 11.0, 9.0, 2.0, 4.0, 6.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08612060546875, -0.08348274230957031, -0.08084487915039062, -0.07820701599121094, -0.07556915283203125, -0.07293128967285156, -0.07029342651367188, -0.06765556335449219, -0.0650177001953125, -0.06237983703613281, -0.059741973876953125, -0.05710411071777344, -0.05446624755859375, -0.05182838439941406, -0.049190521240234375, -0.04655265808105469, -0.043914794921875, -0.04127693176269531, -0.038639068603515625, -0.03600120544433594, -0.03336334228515625, -0.030725479125976562, -0.028087615966796875, -0.025449752807617188, -0.0228118896484375, -0.020174026489257812, -0.017536163330078125, -0.014898300170898438, -0.01226043701171875, -0.009622573852539062, -0.006984710693359375, -0.0043468475341796875, -0.001708984375, 0.0009288787841796875, 0.003566741943359375, 0.0062046051025390625, 0.00884246826171875, 0.011480331420898438, 0.014118194580078125, 0.016756057739257812, 0.0193939208984375, 0.022031784057617188, 0.024669647216796875, 0.027307510375976562, 0.02994537353515625, 0.03258323669433594, 0.035221099853515625, 0.03785896301269531, 0.040496826171875, 0.04313468933105469, 0.045772552490234375, 0.04841041564941406, 0.05104827880859375, 0.05368614196777344, 0.056324005126953125, 0.05896186828613281, 0.0615997314453125, 0.06423759460449219, 0.06687545776367188, 0.06951332092285156, 0.07215118408203125, 0.07478904724121094, 0.07742691040039062, 0.08006477355957031, 0.08270263671875]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 19.0, 84.0, 199.0, 371.0, 225.0, 79.0, 25.0, 7.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017735612345859408, -0.0015005156164988875, -0.001227470114827156, -0.0009544244967401028, -0.0006813788786530495, -0.00040833326056599617, -0.0001352877588942647, 0.0001377578591927886, 0.0004108034772798419, 0.0006838490953668952, 0.0009568946552462876, 0.00122994021512568, 0.0015029858332127333, 0.0017760314512997866, 0.002049076836556196, 0.0023221224546432495, 0.002595168072730303, 0.002868213690817356, 0.0031412593089044094, 0.0034143049269914627, 0.003687350545078516, 0.003960396163165569, 0.004233441315591335, 0.004506487399339676, 0.004779533017426729, 0.0050525786355137825, 0.005325624253600836, 0.005598669871687889, 0.005871715489774942, 0.006144761107861996, 0.006417806260287762, 0.006690852344036102, 0.006963898427784443, 0.007236944045871496, 0.0075099896639585495, 0.007783035282045603, 0.008056080900132656, 0.008329126052558422, 0.008602172136306763, 0.008875217288732529, 0.00914826337248087, 0.009421308524906635, 0.009694354608654976, 0.009967399761080742, 0.010240445844829082, 0.010513490997254848, 0.010786537081003189, 0.011059582233428955, 0.011332627385854721, 0.011605672538280487, 0.011878718622028828, 0.012151763774454594, 0.012424809858202934, 0.0126978550106287, 0.01297090109437704, 0.013243946246802807, 0.013516992330551147, 0.013790037482976913, 0.014063083566725254, 0.01433612871915102, 0.01460917480289936, 0.014882219955325127, 0.015155266039073467, 0.015428311191499233, 0.015701357275247574]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 6.0, 7.0, 11.0, 14.0, 11.0, 13.0, 14.0, 20.0, 18.0, 36.0, 25.0, 33.0, 41.0, 31.0, 39.0, 51.0, 39.0, 34.0, 36.0, 29.0, 49.0, 46.0, 42.0, 42.0, 38.0, 30.0, 36.0, 24.0, 19.0, 19.0, 29.0, 19.0, 17.0, 14.0, 15.0, 12.0, 9.0, 9.0, 8.0, 5.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002568185329437256, -0.002489631064236164, -0.0024110767990350723, -0.0023325225338339806, -0.002253968268632889, -0.002175414003431797, -0.0020968597382307053, -0.0020183054730296135, -0.0019397512078285217, -0.00186119694262743, -0.0017826426774263382, -0.0017040884122252464, -0.0016255341470241547, -0.001546979881823063, -0.0014684256166219711, -0.0013898713514208794, -0.0013113170862197876, -0.0012327628210186958, -0.001154208555817604, -0.0010756542906165123, -0.0009971000254154205, -0.0009185457602143288, -0.000839991495013237, -0.0007614372298121452, -0.0006828829646110535, -0.0006043286994099617, -0.0005257744342088699, -0.00044722016900777817, -0.0003686659038066864, -0.00029011163860559464, -0.00021155737340450287, -0.0001330031082034111, -5.4448843002319336e-05, 2.410542219877243e-05, 0.0001026596873998642, 0.00018121395260095596, 0.00025976821780204773, 0.0003383224830031395, 0.00041687674820423126, 0.000495431013405323, 0.0005739852786064148, 0.0006525395438075066, 0.0007310938090085983, 0.0008096480742096901, 0.0008882023394107819, 0.0009667566046118736, 0.0010453108698129654, 0.0011238651350140572, 0.001202419400215149, 0.0012809736654162407, 0.0013595279306173325, 0.0014380821958184242, 0.001516636461019516, 0.0015951907262206078, 0.0016737449914216995, 0.0017522992566227913, 0.001830853521823883, 0.0019094077870249748, 0.0019879620522260666, 0.0020665163174271584, 0.00214507058262825, 0.002223624847829342, 0.0023021791130304337, 0.0023807333782315254, 0.002459287643432617]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 3.0, 8.0, 5.0, 5.0, 12.0, 4.0, 7.0, 8.0, 7.0, 20.0, 16.0, 13.0, 19.0, 22.0, 28.0, 31.0, 22.0, 27.0, 29.0, 27.0, 39.0, 35.0, 32.0, 47.0, 39.0, 43.0, 44.0, 34.0, 48.0, 29.0, 37.0, 31.0, 33.0, 25.0, 21.0, 23.0, 22.0, 17.0, 14.0, 14.0, 10.0, 14.0, 5.0, 10.0, 10.0, 2.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.65625, -16.05615234375, -15.4560546875, -14.85595703125, -14.255859375, -13.65576171875, -13.0556640625, -12.45556640625, -11.85546875, -11.25537109375, -10.6552734375, -10.05517578125, -9.455078125, -8.85498046875, -8.2548828125, -7.65478515625, -7.0546875, -6.45458984375, -5.8544921875, -5.25439453125, -4.654296875, -4.05419921875, -3.4541015625, -2.85400390625, -2.25390625, -1.65380859375, -1.0537109375, -0.45361328125, 0.146484375, 0.74658203125, 1.3466796875, 1.94677734375, 2.546875, 3.14697265625, 3.7470703125, 4.34716796875, 4.947265625, 5.54736328125, 6.1474609375, 6.74755859375, 7.34765625, 7.94775390625, 8.5478515625, 9.14794921875, 9.748046875, 10.34814453125, 10.9482421875, 11.54833984375, 12.1484375, 12.74853515625, 13.3486328125, 13.94873046875, 14.548828125, 15.14892578125, 15.7490234375, 16.34912109375, 16.94921875, 17.54931640625, 18.1494140625, 18.74951171875, 19.349609375, 19.94970703125, 20.5498046875, 21.14990234375, 21.75]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 3.0, 3.0, 15.0, 11.0, 21.0, 24.0, 39.0, 31.0, 46.0, 71.0, 100.0, 128.0, 207.0, 281.0, 430.0, 579.0, 839.0, 1275.0, 1949.0, 3427.0, 6456.0, 17380.0, 77205.0, 634590.0, 244686.0, 35975.0, 10514.0, 4590.0, 2647.0, 1607.0, 1014.0, 701.0, 496.0, 324.0, 248.0, 169.0, 144.0, 112.0, 56.0, 41.0, 35.0, 22.0, 15.0, 14.0, 13.0, 7.0, 8.0, 6.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-51.8125, -50.2314453125, -48.650390625, -47.0693359375, -45.48828125, -43.9072265625, -42.326171875, -40.7451171875, -39.1640625, -37.5830078125, -36.001953125, -34.4208984375, -32.83984375, -31.2587890625, -29.677734375, -28.0966796875, -26.515625, -24.9345703125, -23.353515625, -21.7724609375, -20.19140625, -18.6103515625, -17.029296875, -15.4482421875, -13.8671875, -12.2861328125, -10.705078125, -9.1240234375, -7.54296875, -5.9619140625, -4.380859375, -2.7998046875, -1.21875, 0.3623046875, 1.943359375, 3.5244140625, 5.10546875, 6.6865234375, 8.267578125, 9.8486328125, 11.4296875, 13.0107421875, 14.591796875, 16.1728515625, 17.75390625, 19.3349609375, 20.916015625, 22.4970703125, 24.078125, 25.6591796875, 27.240234375, 28.8212890625, 30.40234375, 31.9833984375, 33.564453125, 35.1455078125, 36.7265625, 38.3076171875, 39.888671875, 41.4697265625, 43.05078125, 44.6318359375, 46.212890625, 47.7939453125, 49.375]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 11.0, 9.0, 10.0, 13.0, 12.0, 20.0, 16.0, 16.0, 28.0, 23.0, 31.0, 36.0, 31.0, 25.0, 38.0, 47.0, 38.0, 78.0, 136.0, 1603.0, 329.0, 92.0, 75.0, 39.0, 35.0, 37.0, 34.0, 25.0, 28.0, 18.0, 22.0, 13.0, 9.0, 15.0, 15.0, 7.0, 4.0, 5.0, 6.0, 5.0, 1.0, 4.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.8125, -35.53466796875, -34.2568359375, -32.97900390625, -31.701171875, -30.42333984375, -29.1455078125, -27.86767578125, -26.58984375, -25.31201171875, -24.0341796875, -22.75634765625, -21.478515625, -20.20068359375, -18.9228515625, -17.64501953125, -16.3671875, -15.08935546875, -13.8115234375, -12.53369140625, -11.255859375, -9.97802734375, -8.7001953125, -7.42236328125, -6.14453125, -4.86669921875, -3.5888671875, -2.31103515625, -1.033203125, 0.24462890625, 1.5224609375, 2.80029296875, 4.078125, 5.35595703125, 6.6337890625, 7.91162109375, 9.189453125, 10.46728515625, 11.7451171875, 13.02294921875, 14.30078125, 15.57861328125, 16.8564453125, 18.13427734375, 19.412109375, 20.68994140625, 21.9677734375, 23.24560546875, 24.5234375, 25.80126953125, 27.0791015625, 28.35693359375, 29.634765625, 30.91259765625, 32.1904296875, 33.46826171875, 34.74609375, 36.02392578125, 37.3017578125, 38.57958984375, 39.857421875, 41.13525390625, 42.4130859375, 43.69091796875, 44.96875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 7.0, 3.0, 8.0, 8.0, 14.0, 21.0, 26.0, 47.0, 58.0, 111.0, 118.0, 254.0, 490.0, 1547.0, 56012.0, 3081220.0, 3896.0, 822.0, 340.0, 218.0, 141.0, 104.0, 53.0, 54.0, 37.0, 28.0, 12.0, 10.0, 8.0, 6.0, 6.0, 6.0, 6.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-162.0, -156.45703125, -150.9140625, -145.37109375, -139.828125, -134.28515625, -128.7421875, -123.19921875, -117.65625, -112.11328125, -106.5703125, -101.02734375, -95.484375, -89.94140625, -84.3984375, -78.85546875, -73.3125, -67.76953125, -62.2265625, -56.68359375, -51.140625, -45.59765625, -40.0546875, -34.51171875, -28.96875, -23.42578125, -17.8828125, -12.33984375, -6.796875, -1.25390625, 4.2890625, 9.83203125, 15.375, 20.91796875, 26.4609375, 32.00390625, 37.546875, 43.08984375, 48.6328125, 54.17578125, 59.71875, 65.26171875, 70.8046875, 76.34765625, 81.890625, 87.43359375, 92.9765625, 98.51953125, 104.0625, 109.60546875, 115.1484375, 120.69140625, 126.234375, 131.77734375, 137.3203125, 142.86328125, 148.40625, 153.94921875, 159.4921875, 165.03515625, 170.578125, 176.12109375, 181.6640625, 187.20703125, 192.75]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 11.0, 15.0, 29.0, 90.0, 178.0, 267.0, 217.0, 120.0, 48.0, 18.0, 15.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-308.1970520019531, -302.3411560058594, -296.4852294921875, -290.62933349609375, -284.7734375, -278.91754150390625, -273.0616149902344, -267.2057189941406, -261.3498229980469, -255.49391174316406, -249.6380157470703, -243.7821044921875, -237.92620849609375, -232.07029724121094, -226.21438598632812, -220.35848999023438, -214.50257873535156, -208.64666748046875, -202.790771484375, -196.9348602294922, -191.07896423339844, -185.22305297851562, -179.36715698242188, -173.51124572753906, -167.65533447265625, -161.79942321777344, -155.9435272216797, -150.08761596679688, -144.23171997070312, -138.3758087158203, -132.5198974609375, -126.66400146484375, -120.80809783935547, -114.95219421386719, -109.0962905883789, -103.24038696289062, -97.38447570800781, -91.52857971191406, -85.67266845703125, -79.81676483154297, -73.96086120605469, -68.1049575805664, -62.249053955078125, -56.39314651489258, -50.5372428894043, -44.681339263916016, -38.82543182373047, -32.96952819824219, -27.113624572753906, -21.257720947265625, -15.401815414428711, -9.545909881591797, -3.6900062561035156, 2.1658973693847656, 8.021804809570312, 13.877708435058594, 19.733612060546875, 25.589515686035156, 31.44542121887207, 37.301326751708984, 43.157230377197266, 49.01313400268555, 54.869041442871094, 60.724945068359375, 66.58084869384766]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 10.0, 10.0, 14.0, 11.0, 14.0, 20.0, 13.0, 26.0, 34.0, 39.0, 35.0, 39.0, 43.0, 48.0, 44.0, 45.0, 52.0, 70.0, 43.0, 45.0, 45.0, 64.0, 33.0, 44.0, 30.0, 20.0, 24.0, 23.0, 14.0, 9.0, 8.0, 8.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-163.85751342773438, -159.5406036376953, -155.22369384765625, -150.90679931640625, -146.5898895263672, -142.27297973632812, -137.95608520507812, -133.63917541503906, -129.322265625, -125.00535583496094, -120.6884536743164, -116.37155151367188, -112.05464172363281, -107.73773193359375, -103.42082977294922, -99.10392761230469, -94.78701782226562, -90.47010803222656, -86.15320587158203, -81.8363037109375, -77.51939392089844, -73.20248413085938, -68.88558197021484, -64.56867980957031, -60.25177001953125, -55.93486404418945, -51.617958068847656, -47.30105209350586, -42.98414611816406, -38.667240142822266, -34.35033416748047, -30.033428192138672, -25.716506958007812, -21.399600982666016, -17.08269500732422, -12.765789031982422, -8.448883056640625, -4.131977081298828, 0.18492889404296875, 4.501834869384766, 8.818740844726562, 13.13564682006836, 17.452552795410156, 21.769458770751953, 26.08636474609375, 30.403270721435547, 34.720176696777344, 39.03708267211914, 43.35398864746094, 47.670894622802734, 51.98780059814453, 56.30470657348633, 60.621612548828125, 64.93852233886719, 69.25542449951172, 73.57232666015625, 77.88923645019531, 82.20614624023438, 86.5230484008789, 90.83995056152344, 95.1568603515625, 99.47377014160156, 103.7906723022461, 108.10757446289062, 112.42448425292969]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 5.0, 7.0, 9.0, 12.0, 12.0, 22.0, 21.0, 18.0, 22.0, 18.0, 33.0, 26.0, 34.0, 25.0, 30.0, 35.0, 42.0, 34.0, 40.0, 55.0, 40.0, 39.0, 25.0, 38.0, 42.0, 31.0, 28.0, 38.0, 22.0, 25.0, 23.0, 16.0, 20.0, 14.0, 8.0, 12.0, 11.0, 16.0, 10.0, 9.0, 6.0, 4.0, 4.0, 1.0, 0.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.421875, -18.789794921875, -18.15771484375, -17.525634765625, -16.8935546875, -16.261474609375, -15.62939453125, -14.997314453125, -14.365234375, -13.733154296875, -13.10107421875, -12.468994140625, -11.8369140625, -11.204833984375, -10.57275390625, -9.940673828125, -9.30859375, -8.676513671875, -8.04443359375, -7.412353515625, -6.7802734375, -6.148193359375, -5.51611328125, -4.884033203125, -4.251953125, -3.619873046875, -2.98779296875, -2.355712890625, -1.7236328125, -1.091552734375, -0.45947265625, 0.172607421875, 0.8046875, 1.436767578125, 2.06884765625, 2.700927734375, 3.3330078125, 3.965087890625, 4.59716796875, 5.229248046875, 5.861328125, 6.493408203125, 7.12548828125, 7.757568359375, 8.3896484375, 9.021728515625, 9.65380859375, 10.285888671875, 10.91796875, 11.550048828125, 12.18212890625, 12.814208984375, 13.4462890625, 14.078369140625, 14.71044921875, 15.342529296875, 15.974609375, 16.606689453125, 17.23876953125, 17.870849609375, 18.5029296875, 19.135009765625, 19.76708984375, 20.399169921875, 21.03125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 13.0, 11.0, 16.0, 22.0, 37.0, 43.0, 67.0, 114.0, 116.0, 178.0, 318.0, 441.0, 709.0, 1096.0, 2033.0, 4005.0, 11302.0, 76306.0, 1234323.0, 2625920.0, 206749.0, 18457.0, 5639.0, 2506.0, 1353.0, 814.0, 544.0, 343.0, 230.0, 164.0, 124.0, 90.0, 64.0, 50.0, 20.0, 26.0, 10.0, 7.0, 6.0, 8.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.8125, -50.15087890625, -48.4892578125, -46.82763671875, -45.166015625, -43.50439453125, -41.8427734375, -40.18115234375, -38.51953125, -36.85791015625, -35.1962890625, -33.53466796875, -31.873046875, -30.21142578125, -28.5498046875, -26.88818359375, -25.2265625, -23.56494140625, -21.9033203125, -20.24169921875, -18.580078125, -16.91845703125, -15.2568359375, -13.59521484375, -11.93359375, -10.27197265625, -8.6103515625, -6.94873046875, -5.287109375, -3.62548828125, -1.9638671875, -0.30224609375, 1.359375, 3.02099609375, 4.6826171875, 6.34423828125, 8.005859375, 9.66748046875, 11.3291015625, 12.99072265625, 14.65234375, 16.31396484375, 17.9755859375, 19.63720703125, 21.298828125, 22.96044921875, 24.6220703125, 26.28369140625, 27.9453125, 29.60693359375, 31.2685546875, 32.93017578125, 34.591796875, 36.25341796875, 37.9150390625, 39.57666015625, 41.23828125, 42.89990234375, 44.5615234375, 46.22314453125, 47.884765625, 49.54638671875, 51.2080078125, 52.86962890625, 54.53125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 8.0, 14.0, 19.0, 30.0, 28.0, 54.0, 71.0, 124.0, 170.0, 253.0, 362.0, 585.0, 688.0, 569.0, 358.0, 200.0, 180.0, 92.0, 76.0, 38.0, 51.0, 28.0, 19.0, 11.0, 8.0, 8.0, 3.0, 2.0, 2.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.3125, -40.96728515625, -39.6220703125, -38.27685546875, -36.931640625, -35.58642578125, -34.2412109375, -32.89599609375, -31.55078125, -30.20556640625, -28.8603515625, -27.51513671875, -26.169921875, -24.82470703125, -23.4794921875, -22.13427734375, -20.7890625, -19.44384765625, -18.0986328125, -16.75341796875, -15.408203125, -14.06298828125, -12.7177734375, -11.37255859375, -10.02734375, -8.68212890625, -7.3369140625, -5.99169921875, -4.646484375, -3.30126953125, -1.9560546875, -0.61083984375, 0.734375, 2.07958984375, 3.4248046875, 4.77001953125, 6.115234375, 7.46044921875, 8.8056640625, 10.15087890625, 11.49609375, 12.84130859375, 14.1865234375, 15.53173828125, 16.876953125, 18.22216796875, 19.5673828125, 20.91259765625, 22.2578125, 23.60302734375, 24.9482421875, 26.29345703125, 27.638671875, 28.98388671875, 30.3291015625, 31.67431640625, 33.01953125, 34.36474609375, 35.7099609375, 37.05517578125, 38.400390625, 39.74560546875, 41.0908203125, 42.43603515625, 43.78125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 9.0, 2.0, 3.0, 3.0, 4.0, 3.0, 8.0, 15.0, 24.0, 33.0, 43.0, 68.0, 105.0, 195.0, 412.0, 929.0, 3226.0, 23629.0, 2023338.0, 2112945.0, 24144.0, 3312.0, 938.0, 418.0, 178.0, 103.0, 75.0, 41.0, 27.0, 14.0, 14.0, 14.0, 4.0, 2.0, 2.0, 4.0, 5.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.375, -107.12890625, -103.8828125, -100.63671875, -97.390625, -94.14453125, -90.8984375, -87.65234375, -84.40625, -81.16015625, -77.9140625, -74.66796875, -71.421875, -68.17578125, -64.9296875, -61.68359375, -58.4375, -55.19140625, -51.9453125, -48.69921875, -45.453125, -42.20703125, -38.9609375, -35.71484375, -32.46875, -29.22265625, -25.9765625, -22.73046875, -19.484375, -16.23828125, -12.9921875, -9.74609375, -6.5, -3.25390625, -0.0078125, 3.23828125, 6.484375, 9.73046875, 12.9765625, 16.22265625, 19.46875, 22.71484375, 25.9609375, 29.20703125, 32.453125, 35.69921875, 38.9453125, 42.19140625, 45.4375, 48.68359375, 51.9296875, 55.17578125, 58.421875, 61.66796875, 64.9140625, 68.16015625, 71.40625, 74.65234375, 77.8984375, 81.14453125, 84.390625, 87.63671875, 90.8828125, 94.12890625, 97.375]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 17.0, 29.0, 81.0, 159.0, 268.0, 202.0, 133.0, 53.0, 28.0, 20.0, 8.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-270.2859191894531, -262.02593994140625, -253.76596069335938, -245.5059814453125, -237.24598693847656, -228.9860076904297, -220.7260284423828, -212.46604919433594, -204.2060546875, -195.94607543945312, -187.68609619140625, -179.42611694335938, -171.16612243652344, -162.90614318847656, -154.6461639404297, -146.3861846923828, -138.12620544433594, -129.86622619628906, -121.60623931884766, -113.34626007080078, -105.08627319335938, -96.8262939453125, -88.56631469726562, -80.30633544921875, -72.04634857177734, -63.7863655090332, -55.52638244628906, -47.26640319824219, -39.00642013549805, -30.746437072753906, -22.48645782470703, -14.22647476196289, -5.96649169921875, 2.293490409851074, 10.553472518920898, 18.813453674316406, 27.073436737060547, 35.33341979980469, 43.59339904785156, 51.8533821105957, 60.113365173339844, 68.37334442138672, 76.63333129882812, 84.893310546875, 93.15328979492188, 101.41327667236328, 109.67325592041016, 117.93324279785156, 126.19322204589844, 134.4532012939453, 142.7131805419922, 150.97317504882812, 159.233154296875, 167.49313354492188, 175.75311279296875, 184.01309204101562, 192.2730712890625, 200.53305053710938, 208.79302978515625, 217.05300903320312, 225.31300354003906, 233.57298278808594, 241.8329620361328, 250.0929412841797, 258.3529357910156]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 2.0, 5.0, 7.0, 5.0, 17.0, 12.0, 13.0, 13.0, 30.0, 20.0, 24.0, 17.0, 35.0, 32.0, 39.0, 39.0, 49.0, 32.0, 42.0, 55.0, 48.0, 45.0, 39.0, 31.0, 41.0, 35.0, 31.0, 28.0, 28.0, 27.0, 35.0, 14.0, 30.0, 11.0, 17.0, 10.0, 14.0, 5.0, 7.0, 7.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.79100036621094, -125.490966796875, -121.19093322753906, -116.89090728759766, -112.59087371826172, -108.29084014892578, -103.99081420898438, -99.69078063964844, -95.3907470703125, -91.09071350097656, -86.79067993164062, -82.49065399169922, -78.19062042236328, -73.89058685302734, -69.59056091308594, -65.29052734375, -60.99049377441406, -56.690460205078125, -52.39043045043945, -48.09040069580078, -43.790367126464844, -39.490333557128906, -35.190303802490234, -30.89027214050293, -26.590240478515625, -22.29020881652832, -17.990177154541016, -13.690145492553711, -9.390113830566406, -5.090082168579102, -0.7900505065917969, 3.509981155395508, 7.810028076171875, 12.11005973815918, 16.410091400146484, 20.71012306213379, 25.010154724121094, 29.3101863861084, 33.6102180480957, 37.910247802734375, 42.21028137207031, 46.51031494140625, 50.81034469604492, 55.110374450683594, 59.41040802001953, 63.71044158935547, 68.01046752929688, 72.31050109863281, 76.61053466796875, 80.91056823730469, 85.21060180664062, 89.51062774658203, 93.81066131591797, 98.1106948852539, 102.41072082519531, 106.71075439453125, 111.01078796386719, 115.31082153320312, 119.61085510253906, 123.91088104248047, 128.21090698242188, 132.5109405517578, 136.81097412109375, 141.1110076904297, 145.41104125976562]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 5.0, 6.0, 7.0, 7.0, 7.0, 11.0, 10.0, 17.0, 18.0, 20.0, 17.0, 22.0, 24.0, 25.0, 30.0, 23.0, 30.0, 37.0, 39.0, 33.0, 52.0, 35.0, 32.0, 41.0, 36.0, 35.0, 34.0, 36.0, 36.0, 24.0, 32.0, 31.0, 22.0, 29.0, 20.0, 24.0, 14.0, 12.0, 14.0, 9.0, 10.0, 3.0, 5.0, 8.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.4921875, -14.9857177734375, -14.479248046875, -13.9727783203125, -13.46630859375, -12.9598388671875, -12.453369140625, -11.9468994140625, -11.4404296875, -10.9339599609375, -10.427490234375, -9.9210205078125, -9.41455078125, -8.9080810546875, -8.401611328125, -7.8951416015625, -7.388671875, -6.8822021484375, -6.375732421875, -5.8692626953125, -5.36279296875, -4.8563232421875, -4.349853515625, -3.8433837890625, -3.3369140625, -2.8304443359375, -2.323974609375, -1.8175048828125, -1.31103515625, -0.8045654296875, -0.298095703125, 0.2083740234375, 0.71484375, 1.2213134765625, 1.727783203125, 2.2342529296875, 2.74072265625, 3.2471923828125, 3.753662109375, 4.2601318359375, 4.7666015625, 5.2730712890625, 5.779541015625, 6.2860107421875, 6.79248046875, 7.2989501953125, 7.805419921875, 8.3118896484375, 8.818359375, 9.3248291015625, 9.831298828125, 10.3377685546875, 10.84423828125, 11.3507080078125, 11.857177734375, 12.3636474609375, 12.8701171875, 13.3765869140625, 13.883056640625, 14.3895263671875, 14.89599609375, 15.4024658203125, 15.908935546875, 16.4154052734375, 16.921875]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 3.0, 4.0, 9.0, 12.0, 12.0, 22.0, 23.0, 50.0, 60.0, 87.0, 122.0, 199.0, 258.0, 371.0, 507.0, 756.0, 996.0, 1399.0, 2065.0, 2916.0, 4088.0, 5825.0, 8123.0, 11659.0, 17075.0, 24687.0, 37112.0, 56677.0, 91388.0, 161462.0, 229021.0, 144953.0, 83531.0, 52436.0, 34477.0, 23125.0, 15852.0, 11061.0, 7693.0, 5376.0, 3794.0, 2727.0, 1938.0, 1369.0, 938.0, 667.0, 475.0, 356.0, 243.0, 152.0, 139.0, 91.0, 72.0, 37.0, 21.0, 20.0, 16.0, 10.0, 5.0, 4.0, 4.0, 0.0, 1.0], "bins": [-1.2998046875, -1.2584228515625, -1.217041015625, -1.1756591796875, -1.13427734375, -1.0928955078125, -1.051513671875, -1.0101318359375, -0.96875, -0.9273681640625, -0.885986328125, -0.8446044921875, -0.80322265625, -0.7618408203125, -0.720458984375, -0.6790771484375, -0.6376953125, -0.5963134765625, -0.554931640625, -0.5135498046875, -0.47216796875, -0.4307861328125, -0.389404296875, -0.3480224609375, -0.306640625, -0.2652587890625, -0.223876953125, -0.1824951171875, -0.14111328125, -0.0997314453125, -0.058349609375, -0.0169677734375, 0.0244140625, 0.0657958984375, 0.107177734375, 0.1485595703125, 0.18994140625, 0.2313232421875, 0.272705078125, 0.3140869140625, 0.35546875, 0.3968505859375, 0.438232421875, 0.4796142578125, 0.52099609375, 0.5623779296875, 0.603759765625, 0.6451416015625, 0.6865234375, 0.7279052734375, 0.769287109375, 0.8106689453125, 0.85205078125, 0.8934326171875, 0.934814453125, 0.9761962890625, 1.017578125, 1.0589599609375, 1.100341796875, 1.1417236328125, 1.18310546875, 1.2244873046875, 1.265869140625, 1.3072509765625, 1.3486328125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 8.0, 7.0, 9.0, 10.0, 6.0, 14.0, 22.0, 23.0, 22.0, 45.0, 32.0, 32.0, 48.0, 37.0, 53.0, 48.0, 53.0, 44.0, 1080.0, 58.0, 48.0, 39.0, 38.0, 36.0, 34.0, 44.0, 25.0, 27.0, 18.0, 16.0, 12.0, 10.0, 9.0, 8.0, 3.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5546875, -10.1361083984375, -9.717529296875, -9.2989501953125, -8.88037109375, -8.4617919921875, -8.043212890625, -7.6246337890625, -7.2060546875, -6.7874755859375, -6.368896484375, -5.9503173828125, -5.53173828125, -5.1131591796875, -4.694580078125, -4.2760009765625, -3.857421875, -3.4388427734375, -3.020263671875, -2.6016845703125, -2.18310546875, -1.7645263671875, -1.345947265625, -0.9273681640625, -0.5087890625, -0.0902099609375, 0.328369140625, 0.7469482421875, 1.16552734375, 1.5841064453125, 2.002685546875, 2.4212646484375, 2.83984375, 3.2584228515625, 3.677001953125, 4.0955810546875, 4.51416015625, 4.9327392578125, 5.351318359375, 5.7698974609375, 6.1884765625, 6.6070556640625, 7.025634765625, 7.4442138671875, 7.86279296875, 8.2813720703125, 8.699951171875, 9.1185302734375, 9.537109375, 9.9556884765625, 10.374267578125, 10.7928466796875, 11.21142578125, 11.6300048828125, 12.048583984375, 12.4671630859375, 12.8857421875, 13.3043212890625, 13.722900390625, 14.1414794921875, 14.56005859375, 14.9786376953125, 15.397216796875, 15.8157958984375, 16.234375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 3.0, 5.0, 10.0, 21.0, 24.0, 37.0, 43.0, 79.0, 104.0, 167.0, 243.0, 436.0, 696.0, 1080.0, 1900.0, 3215.0, 5544.0, 9536.0, 16964.0, 30921.0, 59311.0, 121199.0, 1258248.0, 342741.0, 117862.0, 57245.0, 30294.0, 16685.0, 9299.0, 5305.0, 3117.0, 1873.0, 1043.0, 664.0, 431.0, 256.0, 174.0, 120.0, 75.0, 51.0, 39.0, 25.0, 16.0, 9.0, 4.0, 8.0, 5.0, 3.0, 0.0, 0.0, 2.0, 3.0], "bins": [-2.103515625, -2.0433807373046875, -1.983245849609375, -1.9231109619140625, -1.86297607421875, -1.8028411865234375, -1.742706298828125, -1.6825714111328125, -1.6224365234375, -1.5623016357421875, -1.502166748046875, -1.4420318603515625, -1.38189697265625, -1.3217620849609375, -1.261627197265625, -1.2014923095703125, -1.141357421875, -1.0812225341796875, -1.021087646484375, -0.9609527587890625, -0.90081787109375, -0.8406829833984375, -0.780548095703125, -0.7204132080078125, -0.6602783203125, -0.6001434326171875, -0.540008544921875, -0.4798736572265625, -0.41973876953125, -0.3596038818359375, -0.299468994140625, -0.2393341064453125, -0.17919921875, -0.1190643310546875, -0.058929443359375, 0.0012054443359375, 0.06134033203125, 0.1214752197265625, 0.181610107421875, 0.2417449951171875, 0.3018798828125, 0.3620147705078125, 0.422149658203125, 0.4822845458984375, 0.54241943359375, 0.6025543212890625, 0.662689208984375, 0.7228240966796875, 0.782958984375, 0.8430938720703125, 0.903228759765625, 0.9633636474609375, 1.02349853515625, 1.0836334228515625, 1.143768310546875, 1.2039031982421875, 1.2640380859375, 1.3241729736328125, 1.384307861328125, 1.4444427490234375, 1.50457763671875, 1.5647125244140625, 1.624847412109375, 1.6849822998046875, 1.7451171875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 5.0, 8.0, 12.0, 14.0, 13.0, 34.0, 41.0, 49.0, 48.0, 74.0, 77.0, 75.0, 79.0, 77.0, 79.0, 67.0, 59.0, 42.0, 34.0, 27.0, 25.0, 23.0, 9.0, 10.0, 4.0, 7.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00557708740234375, -0.005415439605712891, -0.005253791809082031, -0.005092144012451172, -0.0049304962158203125, -0.004768848419189453, -0.004607200622558594, -0.004445552825927734, -0.004283905029296875, -0.004122257232666016, -0.003960609436035156, -0.003798961639404297, -0.0036373138427734375, -0.003475666046142578, -0.0033140182495117188, -0.0031523704528808594, -0.00299072265625, -0.0028290748596191406, -0.0026674270629882812, -0.002505779266357422, -0.0023441314697265625, -0.002182483673095703, -0.0020208358764648438, -0.0018591880798339844, -0.001697540283203125, -0.0015358924865722656, -0.0013742446899414062, -0.0012125968933105469, -0.0010509490966796875, -0.0008893013000488281, -0.0007276535034179688, -0.0005660057067871094, -0.00040435791015625, -0.00024271011352539062, -8.106231689453125e-05, 8.058547973632812e-05, 0.0002422332763671875, 0.0004038810729980469, 0.0005655288696289062, 0.0007271766662597656, 0.000888824462890625, 0.0010504722595214844, 0.0012121200561523438, 0.0013737678527832031, 0.0015354156494140625, 0.0016970634460449219, 0.0018587112426757812, 0.0020203590393066406, 0.0021820068359375, 0.0023436546325683594, 0.0025053024291992188, 0.002666950225830078, 0.0028285980224609375, 0.002990245819091797, 0.0031518936157226562, 0.0033135414123535156, 0.003475189208984375, 0.0036368370056152344, 0.0037984848022460938, 0.003960132598876953, 0.0041217803955078125, 0.004283428192138672, 0.004445075988769531, 0.004606723785400391, 0.00476837158203125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 10.0, 10.0, 17.0, 19.0, 27.0, 52.0, 62.0, 82.0, 116.0, 202.0, 319.0, 532.0, 1658.0, 947753.0, 95375.0, 1073.0, 489.0, 236.0, 156.0, 97.0, 79.0, 38.0, 42.0, 34.0, 19.0, 13.0, 17.0, 9.0, 6.0, 1.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0860595703125, -0.0831766128540039, -0.08029365539550781, -0.07741069793701172, -0.07452774047851562, -0.07164478302001953, -0.06876182556152344, -0.06587886810302734, -0.06299591064453125, -0.060112953186035156, -0.05722999572753906, -0.05434703826904297, -0.051464080810546875, -0.04858112335205078, -0.04569816589355469, -0.042815208435058594, -0.0399322509765625, -0.037049293518066406, -0.03416633605957031, -0.03128337860107422, -0.028400421142578125, -0.02551746368408203, -0.022634506225585938, -0.019751548767089844, -0.01686859130859375, -0.013985633850097656, -0.011102676391601562, -0.008219718933105469, -0.005336761474609375, -0.0024538040161132812, 0.0004291534423828125, 0.0033121109008789062, 0.006195068359375, 0.009078025817871094, 0.011960983276367188, 0.014843940734863281, 0.017726898193359375, 0.02060985565185547, 0.023492813110351562, 0.026375770568847656, 0.02925872802734375, 0.032141685485839844, 0.03502464294433594, 0.03790760040283203, 0.040790557861328125, 0.04367351531982422, 0.04655647277832031, 0.049439430236816406, 0.0523223876953125, 0.055205345153808594, 0.05808830261230469, 0.06097126007080078, 0.06385421752929688, 0.06673717498779297, 0.06962013244628906, 0.07250308990478516, 0.07538604736328125, 0.07826900482177734, 0.08115196228027344, 0.08403491973876953, 0.08691787719726562, 0.08980083465576172, 0.09268379211425781, 0.0955667495727539, 0.09844970703125]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 65.0, 793.0, 148.0, 6.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025228111073374748, -0.02468651533126831, -0.024144919589161873, -0.023603323847055435, -0.023061728104948997, -0.02252013236284256, -0.021978536620736122, -0.021436940878629684, -0.020895346999168396, -0.02035375125706196, -0.01981215551495552, -0.019270559772849083, -0.018728964030742645, -0.018187368288636208, -0.01764577254652977, -0.01710417866706848, -0.016562581062316895, -0.016020985320210457, -0.01547938957810402, -0.014937793835997581, -0.014396198093891144, -0.013854602351784706, -0.013313007541000843, -0.012771411798894405, -0.012229816056787968, -0.01168822031468153, -0.011146624572575092, -0.010605028830468655, -0.010063434019684792, -0.009521838277578354, -0.008980242535471916, -0.008438646793365479, -0.00789705291390419, -0.007355457171797752, -0.006813861429691315, -0.006272266153246164, -0.005730670411139727, -0.005189074669033289, -0.004647479392588139, -0.004105883650481701, -0.003564287908375263, -0.0030226921662688255, -0.0024810966569930315, -0.0019395010313019156, -0.0013979054056107998, -0.0008563096635043621, -0.0003147141542285681, 0.00022688135504722595, 0.0007684770971536636, 0.0013100727228447795, 0.0018516683485358953, 0.0023932638578116894, 0.002934859599918127, 0.0034764553420245647, 0.004018050618469715, 0.004559646360576153, 0.0051012421026825905, 0.005642837844789028, 0.006184433586895466, 0.006726028863340616, 0.007267624605447054, 0.007809220347553492, 0.008350815623998642, 0.00889241136610508, 0.009434007108211517]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 6.0, 4.0, 4.0, 5.0, 5.0, 9.0, 7.0, 8.0, 7.0, 12.0, 16.0, 20.0, 19.0, 19.0, 28.0, 29.0, 30.0, 33.0, 40.0, 28.0, 38.0, 46.0, 47.0, 44.0, 39.0, 41.0, 33.0, 43.0, 36.0, 29.0, 34.0, 33.0, 35.0, 19.0, 26.0, 22.0, 10.0, 21.0, 13.0, 14.0, 10.0, 12.0, 3.0, 7.0, 7.0, 4.0, 0.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0017501115798950195, -0.001693863421678543, -0.0016376152634620667, -0.0015813671052455902, -0.0015251189470291138, -0.0014688707888126373, -0.0014126226305961609, -0.0013563744723796844, -0.001300126314163208, -0.0012438781559467316, -0.0011876299977302551, -0.0011313818395137787, -0.0010751336812973022, -0.0010188855230808258, -0.0009626373648643494, -0.0009063892066478729, -0.0008501410484313965, -0.00079389289021492, -0.0007376447319984436, -0.0006813965737819672, -0.0006251484155654907, -0.0005689002573490143, -0.0005126520991325378, -0.0004564039409160614, -0.00040015578269958496, -0.0003439076244831085, -0.0002876594662666321, -0.00023141130805015564, -0.0001751631498336792, -0.00011891499161720276, -6.266683340072632e-05, -6.418675184249878e-06, 4.982948303222656e-05, 0.000106077641248703, 0.00016232579946517944, 0.00021857395768165588, 0.0002748221158981323, 0.00033107027411460876, 0.0003873184323310852, 0.00044356659054756165, 0.0004998147487640381, 0.0005560629069805145, 0.000612311065196991, 0.0006685592234134674, 0.0007248073816299438, 0.0007810555398464203, 0.0008373036980628967, 0.0008935518562793732, 0.0009498000144958496, 0.001006048172712326, 0.0010622963309288025, 0.001118544489145279, 0.0011747926473617554, 0.0012310408055782318, 0.0012872889637947083, 0.0013435371220111847, 0.0013997852802276611, 0.0014560334384441376, 0.001512281596660614, 0.0015685297548770905, 0.001624777913093567, 0.0016810260713100433, 0.0017372742295265198, 0.0017935223877429962, 0.0018497705459594727]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 5.0, 6.0, 7.0, 7.0, 7.0, 11.0, 10.0, 17.0, 18.0, 20.0, 17.0, 22.0, 24.0, 25.0, 30.0, 23.0, 30.0, 37.0, 39.0, 33.0, 52.0, 35.0, 32.0, 41.0, 36.0, 35.0, 34.0, 36.0, 36.0, 24.0, 32.0, 31.0, 22.0, 29.0, 20.0, 24.0, 14.0, 12.0, 14.0, 9.0, 10.0, 3.0, 5.0, 8.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.4921875, -14.9857177734375, -14.479248046875, -13.9727783203125, -13.46630859375, -12.9598388671875, -12.453369140625, -11.9468994140625, -11.4404296875, -10.9339599609375, -10.427490234375, -9.9210205078125, -9.41455078125, -8.9080810546875, -8.401611328125, -7.8951416015625, -7.388671875, -6.8822021484375, -6.375732421875, -5.8692626953125, -5.36279296875, -4.8563232421875, -4.349853515625, -3.8433837890625, -3.3369140625, -2.8304443359375, -2.323974609375, -1.8175048828125, -1.31103515625, -0.8045654296875, -0.298095703125, 0.2083740234375, 0.71484375, 1.2213134765625, 1.727783203125, 2.2342529296875, 2.74072265625, 3.2471923828125, 3.753662109375, 4.2601318359375, 4.7666015625, 5.2730712890625, 5.779541015625, 6.2860107421875, 6.79248046875, 7.2989501953125, 7.805419921875, 8.3118896484375, 8.818359375, 9.3248291015625, 9.831298828125, 10.3377685546875, 10.84423828125, 11.3507080078125, 11.857177734375, 12.3636474609375, 12.8701171875, 13.3765869140625, 13.883056640625, 14.3895263671875, 14.89599609375, 15.4024658203125, 15.908935546875, 16.4154052734375, 16.921875]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 2.0, 7.0, 11.0, 5.0, 14.0, 28.0, 22.0, 29.0, 65.0, 91.0, 141.0, 166.0, 220.0, 358.0, 491.0, 783.0, 1246.0, 2072.0, 3687.0, 7742.0, 18914.0, 54655.0, 218005.0, 538978.0, 134346.0, 38291.0, 14031.0, 6112.0, 3061.0, 1738.0, 1078.0, 677.0, 492.0, 295.0, 224.0, 125.0, 103.0, 74.0, 48.0, 37.0, 25.0, 26.0, 14.0, 10.0, 2.0, 9.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.890625, -26.03271484375, -25.1748046875, -24.31689453125, -23.458984375, -22.60107421875, -21.7431640625, -20.88525390625, -20.02734375, -19.16943359375, -18.3115234375, -17.45361328125, -16.595703125, -15.73779296875, -14.8798828125, -14.02197265625, -13.1640625, -12.30615234375, -11.4482421875, -10.59033203125, -9.732421875, -8.87451171875, -8.0166015625, -7.15869140625, -6.30078125, -5.44287109375, -4.5849609375, -3.72705078125, -2.869140625, -2.01123046875, -1.1533203125, -0.29541015625, 0.5625, 1.42041015625, 2.2783203125, 3.13623046875, 3.994140625, 4.85205078125, 5.7099609375, 6.56787109375, 7.42578125, 8.28369140625, 9.1416015625, 9.99951171875, 10.857421875, 11.71533203125, 12.5732421875, 13.43115234375, 14.2890625, 15.14697265625, 16.0048828125, 16.86279296875, 17.720703125, 18.57861328125, 19.4365234375, 20.29443359375, 21.15234375, 22.01025390625, 22.8681640625, 23.72607421875, 24.583984375, 25.44189453125, 26.2998046875, 27.15771484375, 28.015625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 6.0, 6.0, 4.0, 8.0, 9.0, 14.0, 17.0, 23.0, 22.0, 27.0, 47.0, 41.0, 42.0, 49.0, 54.0, 77.0, 139.0, 1651.0, 291.0, 108.0, 78.0, 43.0, 32.0, 34.0, 25.0, 37.0, 30.0, 15.0, 22.0, 9.0, 13.0, 17.0, 13.0, 7.0, 8.0, 7.0, 6.0, 6.0, 2.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.5625, -37.2685546875, -35.974609375, -34.6806640625, -33.38671875, -32.0927734375, -30.798828125, -29.5048828125, -28.2109375, -26.9169921875, -25.623046875, -24.3291015625, -23.03515625, -21.7412109375, -20.447265625, -19.1533203125, -17.859375, -16.5654296875, -15.271484375, -13.9775390625, -12.68359375, -11.3896484375, -10.095703125, -8.8017578125, -7.5078125, -6.2138671875, -4.919921875, -3.6259765625, -2.33203125, -1.0380859375, 0.255859375, 1.5498046875, 2.84375, 4.1376953125, 5.431640625, 6.7255859375, 8.01953125, 9.3134765625, 10.607421875, 11.9013671875, 13.1953125, 14.4892578125, 15.783203125, 17.0771484375, 18.37109375, 19.6650390625, 20.958984375, 22.2529296875, 23.546875, 24.8408203125, 26.134765625, 27.4287109375, 28.72265625, 30.0166015625, 31.310546875, 32.6044921875, 33.8984375, 35.1923828125, 36.486328125, 37.7802734375, 39.07421875, 40.3681640625, 41.662109375, 42.9560546875, 44.25]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 7.0, 7.0, 4.0, 9.0, 13.0, 8.0, 17.0, 11.0, 29.0, 28.0, 39.0, 57.0, 84.0, 139.0, 236.0, 428.0, 976.0, 14239.0, 3117944.0, 9456.0, 910.0, 422.0, 205.0, 147.0, 97.0, 44.0, 34.0, 29.0, 25.0, 15.0, 12.0, 4.0, 6.0, 4.0, 5.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-132.25, -128.5205078125, -124.791015625, -121.0615234375, -117.33203125, -113.6025390625, -109.873046875, -106.1435546875, -102.4140625, -98.6845703125, -94.955078125, -91.2255859375, -87.49609375, -83.7666015625, -80.037109375, -76.3076171875, -72.578125, -68.8486328125, -65.119140625, -61.3896484375, -57.66015625, -53.9306640625, -50.201171875, -46.4716796875, -42.7421875, -39.0126953125, -35.283203125, -31.5537109375, -27.82421875, -24.0947265625, -20.365234375, -16.6357421875, -12.90625, -9.1767578125, -5.447265625, -1.7177734375, 2.01171875, 5.7412109375, 9.470703125, 13.2001953125, 16.9296875, 20.6591796875, 24.388671875, 28.1181640625, 31.84765625, 35.5771484375, 39.306640625, 43.0361328125, 46.765625, 50.4951171875, 54.224609375, 57.9541015625, 61.68359375, 65.4130859375, 69.142578125, 72.8720703125, 76.6015625, 80.3310546875, 84.060546875, 87.7900390625, 91.51953125, 95.2490234375, 98.978515625, 102.7080078125, 106.4375]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [2.0, 5.0, 218.0, 745.0, 45.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.54766082763672, -29.34783935546875, -16.14801597595215, -2.948192596435547, 10.251628875732422, 23.451454162597656, 36.651275634765625, 49.851097106933594, 63.05091857910156, 76.25074005126953, 89.4505615234375, 102.650390625, 115.85020446777344, 129.05003356933594, 142.24984741210938, 155.44967651367188, 168.64950561523438, 181.84933471679688, 195.0491485595703, 208.2489776611328, 221.44879150390625, 234.64862060546875, 247.84844970703125, 261.04827880859375, 274.2480773925781, 287.4479064941406, 300.6477355957031, 313.8475341796875, 327.04736328125, 340.2471923828125, 353.447021484375, 366.6468505859375, 379.8466491699219, 393.0464782714844, 406.2463073730469, 419.44610595703125, 432.64593505859375, 445.84576416015625, 459.04559326171875, 472.24542236328125, 485.4452209472656, 498.6450500488281, 511.8448791503906, 525.044677734375, 538.2445068359375, 551.4443359375, 564.6441650390625, 577.843994140625, 591.0438232421875, 604.24365234375, 617.4434814453125, 630.643310546875, 643.8431396484375, 657.04296875, 670.2427368164062, 683.4425659179688, 696.6423950195312, 709.8422241210938, 723.0420532226562, 736.2418823242188, 749.4417114257812, 762.6414794921875, 775.84130859375, 789.0411376953125, 802.240966796875]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 5.0, 10.0, 9.0, 17.0, 10.0, 16.0, 20.0, 22.0, 12.0, 24.0, 29.0, 44.0, 42.0, 31.0, 41.0, 44.0, 47.0, 44.0, 51.0, 58.0, 47.0, 62.0, 58.0, 30.0, 33.0, 28.0, 26.0, 20.0, 24.0, 26.0, 16.0, 11.0, 8.0, 11.0, 4.0, 8.0, 10.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.04360961914062, -88.7571792602539, -85.47074127197266, -82.18431091308594, -78.89787292480469, -75.61144256591797, -72.32500457763672, -69.03857421875, -65.75213623046875, -62.465702056884766, -59.17926788330078, -55.8928337097168, -52.60639953613281, -49.319969177246094, -46.033531188964844, -42.747100830078125, -39.46066665649414, -36.174232482910156, -32.88779830932617, -29.601364135742188, -26.314929962158203, -23.02849769592285, -19.742063522338867, -16.455629348754883, -13.169195175170898, -9.882761001586914, -6.596327304840088, -3.3098936080932617, -0.023459434509277344, 3.2629737854003906, 6.549407958984375, 9.83584213256836, 13.122276306152344, 16.408710479736328, 19.695144653320312, 22.981578826904297, 26.26801300048828, 29.554445266723633, 32.84088134765625, 36.12731170654297, 39.41374969482422, 42.7001838684082, 45.98661804199219, 49.27305221557617, 52.559486389160156, 55.845916748046875, 59.132354736328125, 62.418785095214844, 65.70521545410156, 68.99164581298828, 72.27808380126953, 75.56451416015625, 78.8509521484375, 82.13738250732422, 85.42382049560547, 88.71025085449219, 91.99668884277344, 95.28311920166016, 98.5695571899414, 101.85598754882812, 105.14242553710938, 108.4288558959961, 111.71529388427734, 115.00172424316406, 118.28816223144531]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 1.0, 4.0, 5.0, 8.0, 8.0, 15.0, 11.0, 14.0, 17.0, 14.0, 15.0, 21.0, 28.0, 28.0, 28.0, 29.0, 31.0, 45.0, 44.0, 27.0, 42.0, 40.0, 54.0, 32.0, 46.0, 39.0, 46.0, 34.0, 30.0, 27.0, 40.0, 29.0, 19.0, 18.0, 18.0, 14.0, 17.0, 15.0, 10.0, 11.0, 10.0, 9.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-19.953125, -19.334228515625, -18.71533203125, -18.096435546875, -17.4775390625, -16.858642578125, -16.23974609375, -15.620849609375, -15.001953125, -14.383056640625, -13.76416015625, -13.145263671875, -12.5263671875, -11.907470703125, -11.28857421875, -10.669677734375, -10.05078125, -9.431884765625, -8.81298828125, -8.194091796875, -7.5751953125, -6.956298828125, -6.33740234375, -5.718505859375, -5.099609375, -4.480712890625, -3.86181640625, -3.242919921875, -2.6240234375, -2.005126953125, -1.38623046875, -0.767333984375, -0.1484375, 0.470458984375, 1.08935546875, 1.708251953125, 2.3271484375, 2.946044921875, 3.56494140625, 4.183837890625, 4.802734375, 5.421630859375, 6.04052734375, 6.659423828125, 7.2783203125, 7.897216796875, 8.51611328125, 9.135009765625, 9.75390625, 10.372802734375, 10.99169921875, 11.610595703125, 12.2294921875, 12.848388671875, 13.46728515625, 14.086181640625, 14.705078125, 15.323974609375, 15.94287109375, 16.561767578125, 17.1806640625, 17.799560546875, 18.41845703125, 19.037353515625, 19.65625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 2.0, 3.0, 7.0, 11.0, 17.0, 22.0, 23.0, 42.0, 28.0, 49.0, 56.0, 89.0, 103.0, 160.0, 225.0, 303.0, 408.0, 745.0, 1433.0, 3392.0, 10002.0, 46533.0, 2334675.0, 1742237.0, 37996.0, 9049.0, 3088.0, 1378.0, 738.0, 418.0, 276.0, 193.0, 138.0, 123.0, 77.0, 58.0, 38.0, 27.0, 28.0, 23.0, 23.0, 9.0, 15.0, 6.0, 5.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-102.1875, -99.177734375, -96.16796875, -93.158203125, -90.1484375, -87.138671875, -84.12890625, -81.119140625, -78.109375, -75.099609375, -72.08984375, -69.080078125, -66.0703125, -63.060546875, -60.05078125, -57.041015625, -54.03125, -51.021484375, -48.01171875, -45.001953125, -41.9921875, -38.982421875, -35.97265625, -32.962890625, -29.953125, -26.943359375, -23.93359375, -20.923828125, -17.9140625, -14.904296875, -11.89453125, -8.884765625, -5.875, -2.865234375, 0.14453125, 3.154296875, 6.1640625, 9.173828125, 12.18359375, 15.193359375, 18.203125, 21.212890625, 24.22265625, 27.232421875, 30.2421875, 33.251953125, 36.26171875, 39.271484375, 42.28125, 45.291015625, 48.30078125, 51.310546875, 54.3203125, 57.330078125, 60.33984375, 63.349609375, 66.359375, 69.369140625, 72.37890625, 75.388671875, 78.3984375, 81.408203125, 84.41796875, 87.427734375, 90.4375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 3.0, 6.0, 8.0, 2.0, 9.0, 14.0, 13.0, 26.0, 30.0, 37.0, 39.0, 65.0, 96.0, 124.0, 211.0, 332.0, 575.0, 725.0, 667.0, 380.0, 222.0, 140.0, 77.0, 43.0, 58.0, 43.0, 24.0, 22.0, 26.0, 16.0, 7.0, 11.0, 7.0, 2.0, 5.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.71875, -40.2666015625, -38.814453125, -37.3623046875, -35.91015625, -34.4580078125, -33.005859375, -31.5537109375, -30.1015625, -28.6494140625, -27.197265625, -25.7451171875, -24.29296875, -22.8408203125, -21.388671875, -19.9365234375, -18.484375, -17.0322265625, -15.580078125, -14.1279296875, -12.67578125, -11.2236328125, -9.771484375, -8.3193359375, -6.8671875, -5.4150390625, -3.962890625, -2.5107421875, -1.05859375, 0.3935546875, 1.845703125, 3.2978515625, 4.75, 6.2021484375, 7.654296875, 9.1064453125, 10.55859375, 12.0107421875, 13.462890625, 14.9150390625, 16.3671875, 17.8193359375, 19.271484375, 20.7236328125, 22.17578125, 23.6279296875, 25.080078125, 26.5322265625, 27.984375, 29.4365234375, 30.888671875, 32.3408203125, 33.79296875, 35.2451171875, 36.697265625, 38.1494140625, 39.6015625, 41.0537109375, 42.505859375, 43.9580078125, 45.41015625, 46.8623046875, 48.314453125, 49.7666015625, 51.21875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 6.0, 6.0, 10.0, 14.0, 22.0, 33.0, 50.0, 73.0, 95.0, 135.0, 222.0, 387.0, 564.0, 945.0, 1691.0, 2769.0, 4921.0, 9045.0, 17941.0, 39378.0, 103583.0, 427657.0, 2757198.0, 612292.0, 125778.0, 45872.0, 20284.0, 10126.0, 5480.0, 3114.0, 1771.0, 1035.0, 645.0, 386.0, 251.0, 171.0, 107.0, 80.0, 49.0, 33.0, 22.0, 28.0, 8.0, 5.0, 3.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.8125, -34.80615234375, -33.7998046875, -32.79345703125, -31.787109375, -30.78076171875, -29.7744140625, -28.76806640625, -27.76171875, -26.75537109375, -25.7490234375, -24.74267578125, -23.736328125, -22.72998046875, -21.7236328125, -20.71728515625, -19.7109375, -18.70458984375, -17.6982421875, -16.69189453125, -15.685546875, -14.67919921875, -13.6728515625, -12.66650390625, -11.66015625, -10.65380859375, -9.6474609375, -8.64111328125, -7.634765625, -6.62841796875, -5.6220703125, -4.61572265625, -3.609375, -2.60302734375, -1.5966796875, -0.59033203125, 0.416015625, 1.42236328125, 2.4287109375, 3.43505859375, 4.44140625, 5.44775390625, 6.4541015625, 7.46044921875, 8.466796875, 9.47314453125, 10.4794921875, 11.48583984375, 12.4921875, 13.49853515625, 14.5048828125, 15.51123046875, 16.517578125, 17.52392578125, 18.5302734375, 19.53662109375, 20.54296875, 21.54931640625, 22.5556640625, 23.56201171875, 24.568359375, 25.57470703125, 26.5810546875, 27.58740234375, 28.59375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 5.0, 5.0, 11.0, 9.0, 11.0, 13.0, 13.0, 22.0, 19.0, 32.0, 45.0, 53.0, 66.0, 87.0, 91.0, 99.0, 84.0, 74.0, 55.0, 55.0, 33.0, 22.0, 14.0, 18.0, 13.0, 12.0, 6.0, 5.0, 3.0, 3.0, 2.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-250.29344177246094, -243.0085906982422, -235.72372436523438, -228.43887329101562, -221.15402221679688, -213.86917114257812, -206.5843048095703, -199.29945373535156, -192.0146026611328, -184.72975158691406, -177.44488525390625, -170.1600341796875, -162.87518310546875, -155.59033203125, -148.3054656982422, -141.02061462402344, -133.73574829101562, -126.45088958740234, -119.1660385131836, -111.88117980957031, -104.59632873535156, -97.31147003173828, -90.026611328125, -82.74176025390625, -75.4569091796875, -68.17205047607422, -60.88719940185547, -53.60234069824219, -46.31748962402344, -39.032630920410156, -31.74777603149414, -24.462921142578125, -17.178070068359375, -9.89321517944336, -2.6083593368530273, 4.676496505737305, 11.96135139465332, 19.24620819091797, 26.531063079833984, 33.81591796875, 41.100772857666016, 48.38562774658203, 55.67048263549805, 62.95533752441406, 70.24019622802734, 77.52505493164062, 84.80990600585938, 92.09475708007812, 99.3796157836914, 106.66447448730469, 113.94932556152344, 121.23418426513672, 128.51904296875, 135.80389404296875, 143.0887451171875, 150.37359619140625, 157.65846252441406, 164.9433135986328, 172.22817993164062, 179.51303100585938, 186.79788208007812, 194.08273315429688, 201.3675994873047, 208.65245056152344, 215.9373016357422]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 8.0, 5.0, 4.0, 3.0, 9.0, 9.0, 10.0, 9.0, 13.0, 28.0, 30.0, 21.0, 31.0, 28.0, 26.0, 32.0, 28.0, 28.0, 35.0, 48.0, 54.0, 35.0, 46.0, 40.0, 46.0, 33.0, 40.0, 46.0, 27.0, 28.0, 25.0, 22.0, 27.0, 27.0, 15.0, 10.0, 15.0, 13.0, 10.0, 7.0, 10.0, 6.0, 5.0, 8.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-187.38294982910156, -182.02053833007812, -176.65814208984375, -171.2957305908203, -165.93331909179688, -160.5709228515625, -155.20851135253906, -149.84609985351562, -144.48370361328125, -139.1212921142578, -133.75889587402344, -128.396484375, -123.03407287597656, -117.67166900634766, -112.30926513671875, -106.94685363769531, -101.58444213867188, -96.22203826904297, -90.85962677001953, -85.49722290039062, -80.13481140136719, -74.77240753173828, -69.41000366210938, -64.04759216308594, -58.68518829345703, -53.32278060913086, -47.96037292480469, -42.59796905517578, -37.23556137084961, -31.873153686523438, -26.51074981689453, -21.14834213256836, -15.78594970703125, -10.423542976379395, -5.061136245727539, 0.30126953125, 5.663677215576172, 11.026084899902344, 16.38848876953125, 21.750896453857422, 27.113304138183594, 32.475711822509766, 37.83811950683594, 43.200523376464844, 48.562931060791016, 53.92533874511719, 59.287742614746094, 64.650146484375, 70.01255798339844, 75.37496185302734, 80.73737335205078, 86.09977722167969, 91.46218872070312, 96.82459259033203, 102.18699645996094, 107.54940795898438, 112.91181182861328, 118.27421569824219, 123.63662719726562, 128.9990234375, 134.36143493652344, 139.72384643554688, 145.08624267578125, 150.4486541748047, 155.81106567382812]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 5.0, 8.0, 3.0, 12.0, 10.0, 13.0, 16.0, 31.0, 23.0, 31.0, 43.0, 28.0, 36.0, 32.0, 52.0, 64.0, 53.0, 52.0, 48.0, 56.0, 53.0, 38.0, 45.0, 40.0, 29.0, 35.0, 20.0, 31.0, 21.0, 10.0, 12.0, 11.0, 12.0, 7.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-310.0, -299.90234375, -289.8046875, -279.70703125, -269.609375, -259.51171875, -249.4140625, -239.31640625, -229.21875, -219.12109375, -209.0234375, -198.92578125, -188.828125, -178.73046875, -168.6328125, -158.53515625, -148.4375, -138.33984375, -128.2421875, -118.14453125, -108.046875, -97.94921875, -87.8515625, -77.75390625, -67.65625, -57.55859375, -47.4609375, -37.36328125, -27.265625, -17.16796875, -7.0703125, 3.02734375, 13.125, 23.22265625, 33.3203125, 43.41796875, 53.515625, 63.61328125, 73.7109375, 83.80859375, 93.90625, 104.00390625, 114.1015625, 124.19921875, 134.296875, 144.39453125, 154.4921875, 164.58984375, 174.6875, 184.78515625, 194.8828125, 204.98046875, 215.078125, 225.17578125, 235.2734375, 245.37109375, 255.46875, 265.56640625, 275.6640625, 285.76171875, 295.859375, 305.95703125, 316.0546875, 326.15234375, 336.25]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 3.0, 6.0, 3.0, 5.0, 17.0, 15.0, 20.0, 30.0, 49.0, 83.0, 134.0, 231.0, 306.0, 518.0, 817.0, 1249.0, 2058.0, 3184.0, 4965.0, 7805.0, 12815.0, 21728.0, 37977.0, 71248.0, 148373.0, 316400.0, 206816.0, 94182.0, 48712.0, 27115.0, 15850.0, 9514.0, 5850.0, 3874.0, 2428.0, 1460.0, 988.0, 605.0, 399.0, 257.0, 188.0, 95.0, 60.0, 54.0, 19.0, 19.0, 11.0, 9.0, 6.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0], "bins": [-31.65625, -30.688232421875, -29.72021484375, -28.752197265625, -27.7841796875, -26.816162109375, -25.84814453125, -24.880126953125, -23.912109375, -22.944091796875, -21.97607421875, -21.008056640625, -20.0400390625, -19.072021484375, -18.10400390625, -17.135986328125, -16.16796875, -15.199951171875, -14.23193359375, -13.263916015625, -12.2958984375, -11.327880859375, -10.35986328125, -9.391845703125, -8.423828125, -7.455810546875, -6.48779296875, -5.519775390625, -4.5517578125, -3.583740234375, -2.61572265625, -1.647705078125, -0.6796875, 0.288330078125, 1.25634765625, 2.224365234375, 3.1923828125, 4.160400390625, 5.12841796875, 6.096435546875, 7.064453125, 8.032470703125, 9.00048828125, 9.968505859375, 10.9365234375, 11.904541015625, 12.87255859375, 13.840576171875, 14.80859375, 15.776611328125, 16.74462890625, 17.712646484375, 18.6806640625, 19.648681640625, 20.61669921875, 21.584716796875, 22.552734375, 23.520751953125, 24.48876953125, 25.456787109375, 26.4248046875, 27.392822265625, 28.36083984375, 29.328857421875, 30.296875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 3.0, 4.0, 6.0, 14.0, 13.0, 13.0, 20.0, 23.0, 20.0, 24.0, 26.0, 32.0, 33.0, 28.0, 27.0, 36.0, 41.0, 37.0, 45.0, 1066.0, 52.0, 38.0, 43.0, 30.0, 40.0, 32.0, 42.0, 28.0, 29.0, 36.0, 19.0, 23.0, 29.0, 8.0, 16.0, 8.0, 11.0, 6.0, 8.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-176.625, -171.046875, -165.46875, -159.890625, -154.3125, -148.734375, -143.15625, -137.578125, -132.0, -126.421875, -120.84375, -115.265625, -109.6875, -104.109375, -98.53125, -92.953125, -87.375, -81.796875, -76.21875, -70.640625, -65.0625, -59.484375, -53.90625, -48.328125, -42.75, -37.171875, -31.59375, -26.015625, -20.4375, -14.859375, -9.28125, -3.703125, 1.875, 7.453125, 13.03125, 18.609375, 24.1875, 29.765625, 35.34375, 40.921875, 46.5, 52.078125, 57.65625, 63.234375, 68.8125, 74.390625, 79.96875, 85.546875, 91.125, 96.703125, 102.28125, 107.859375, 113.4375, 119.015625, 124.59375, 130.171875, 135.75, 141.328125, 146.90625, 152.484375, 158.0625, 163.640625, 169.21875, 174.796875, 180.375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 8.0, 2.0, 8.0, 14.0, 17.0, 28.0, 38.0, 62.0, 80.0, 154.0, 205.0, 339.0, 528.0, 885.0, 1511.0, 2572.0, 4620.0, 7653.0, 13340.0, 23728.0, 43258.0, 81950.0, 183222.0, 1404762.0, 161017.0, 75228.0, 40414.0, 21621.0, 12634.0, 7137.0, 4007.0, 2408.0, 1433.0, 802.0, 517.0, 335.0, 196.0, 132.0, 95.0, 57.0, 38.0, 26.0, 22.0, 11.0, 10.0, 4.0, 5.0, 6.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-32.375, -31.434814453125, -30.49462890625, -29.554443359375, -28.6142578125, -27.674072265625, -26.73388671875, -25.793701171875, -24.853515625, -23.913330078125, -22.97314453125, -22.032958984375, -21.0927734375, -20.152587890625, -19.21240234375, -18.272216796875, -17.33203125, -16.391845703125, -15.45166015625, -14.511474609375, -13.5712890625, -12.631103515625, -11.69091796875, -10.750732421875, -9.810546875, -8.870361328125, -7.93017578125, -6.989990234375, -6.0498046875, -5.109619140625, -4.16943359375, -3.229248046875, -2.2890625, -1.348876953125, -0.40869140625, 0.531494140625, 1.4716796875, 2.411865234375, 3.35205078125, 4.292236328125, 5.232421875, 6.172607421875, 7.11279296875, 8.052978515625, 8.9931640625, 9.933349609375, 10.87353515625, 11.813720703125, 12.75390625, 13.694091796875, 14.63427734375, 15.574462890625, 16.5146484375, 17.454833984375, 18.39501953125, 19.335205078125, 20.275390625, 21.215576171875, 22.15576171875, 23.095947265625, 24.0361328125, 24.976318359375, 25.91650390625, 26.856689453125, 27.796875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 5.0, 4.0, 16.0, 12.0, 22.0, 25.0, 30.0, 34.0, 41.0, 55.0, 66.0, 70.0, 77.0, 76.0, 67.0, 81.0, 60.0, 56.0, 50.0, 35.0, 38.0, 14.0, 17.0, 17.0, 7.0, 5.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11590576171875, -0.11232948303222656, -0.10875320434570312, -0.10517692565917969, -0.10160064697265625, -0.09802436828613281, -0.09444808959960938, -0.09087181091308594, -0.0872955322265625, -0.08371925354003906, -0.08014297485351562, -0.07656669616699219, -0.07299041748046875, -0.06941413879394531, -0.06583786010742188, -0.06226158142089844, -0.058685302734375, -0.05510902404785156, -0.051532745361328125, -0.04795646667480469, -0.04438018798828125, -0.04080390930175781, -0.037227630615234375, -0.03365135192871094, -0.0300750732421875, -0.026498794555664062, -0.022922515869140625, -0.019346237182617188, -0.01576995849609375, -0.012193679809570312, -0.008617401123046875, -0.0050411224365234375, -0.00146484375, 0.0021114349365234375, 0.005687713623046875, 0.009263992309570312, 0.01284027099609375, 0.016416549682617188, 0.019992828369140625, 0.023569107055664062, 0.0271453857421875, 0.030721664428710938, 0.034297943115234375, 0.03787422180175781, 0.04145050048828125, 0.04502677917480469, 0.048603057861328125, 0.05217933654785156, 0.055755615234375, 0.05933189392089844, 0.06290817260742188, 0.06648445129394531, 0.07006072998046875, 0.07363700866699219, 0.07721328735351562, 0.08078956604003906, 0.0843658447265625, 0.08794212341308594, 0.09151840209960938, 0.09509468078613281, 0.09867095947265625, 0.10224723815917969, 0.10582351684570312, 0.10939979553222656, 0.11297607421875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 18.0, 19.0, 15.0, 20.0, 33.0, 36.0, 61.0, 65.0, 98.0, 150.0, 183.0, 266.0, 481.0, 823.0, 1769.0, 4061.0, 11602.0, 38836.0, 165343.0, 542174.0, 211415.0, 48095.0, 13816.0, 4716.0, 1916.0, 922.0, 516.0, 308.0, 218.0, 157.0, 88.0, 79.0, 52.0, 45.0, 34.0, 24.0, 15.0, 22.0, 17.0, 5.0, 4.0, 3.0, 3.0, 5.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.65625, -0.635467529296875, -0.61468505859375, -0.593902587890625, -0.5731201171875, -0.552337646484375, -0.53155517578125, -0.510772705078125, -0.489990234375, -0.469207763671875, -0.44842529296875, -0.427642822265625, -0.4068603515625, -0.386077880859375, -0.36529541015625, -0.344512939453125, -0.32373046875, -0.302947998046875, -0.28216552734375, -0.261383056640625, -0.2406005859375, -0.219818115234375, -0.19903564453125, -0.178253173828125, -0.157470703125, -0.136688232421875, -0.11590576171875, -0.095123291015625, -0.0743408203125, -0.053558349609375, -0.03277587890625, -0.011993408203125, 0.0087890625, 0.029571533203125, 0.05035400390625, 0.071136474609375, 0.0919189453125, 0.112701416015625, 0.13348388671875, 0.154266357421875, 0.175048828125, 0.195831298828125, 0.21661376953125, 0.237396240234375, 0.2581787109375, 0.278961181640625, 0.29974365234375, 0.320526123046875, 0.34130859375, 0.362091064453125, 0.38287353515625, 0.403656005859375, 0.4244384765625, 0.445220947265625, 0.46600341796875, 0.486785888671875, 0.507568359375, 0.528350830078125, 0.54913330078125, 0.569915771484375, 0.5906982421875, 0.611480712890625, 0.63226318359375, 0.653045654296875, 0.673828125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 0.0, 8.0, 7.0, 12.0, 23.0, 50.0, 87.0, 165.0, 256.0, 188.0, 100.0, 53.0, 32.0, 15.0, 6.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13805687427520752, -0.13064159452915192, -0.12322630733251572, -0.11581102758646011, -0.10839574784040451, -0.10098046064376831, -0.09356518089771271, -0.0861499011516571, -0.0787346214056015, -0.0713193416595459, -0.0639040544629097, -0.056488774716854095, -0.04907349497079849, -0.04165821149945259, -0.03424292802810669, -0.026827648282051086, -0.019412361085414886, -0.011997079476714134, -0.004581796936690807, 0.0028334856033325195, 0.010248767212033272, 0.017664048820734024, 0.025079332292079926, 0.03249461203813553, 0.03990989550948143, 0.04732517898082733, 0.054740458726882935, 0.062155742198228836, 0.06957102566957474, 0.07698630541563034, 0.08440159261226654, 0.09181687235832214, 0.09923215210437775, 0.10664743185043335, 0.11406271904706955, 0.12147799879312515, 0.12889328598976135, 0.13630856573581696, 0.14372384548187256, 0.15113912522792816, 0.15855440497398376, 0.16596968472003937, 0.17338496446609497, 0.18080025911331177, 0.18821553885936737, 0.19563081860542297, 0.20304609835147858, 0.21046137809753418, 0.21787667274475098, 0.22529195249080658, 0.23270723223686218, 0.24012252688407898, 0.24753780663013458, 0.2549530863761902, 0.262368381023407, 0.2697836458683014, 0.2771989107131958, 0.2846142053604126, 0.292029470205307, 0.2994447648525238, 0.3068600296974182, 0.314275324344635, 0.3216906189918518, 0.3291058838367462, 0.336521178483963]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 4.0, 6.0, 10.0, 5.0, 8.0, 9.0, 6.0, 12.0, 20.0, 16.0, 30.0, 26.0, 25.0, 24.0, 30.0, 37.0, 29.0, 51.0, 42.0, 45.0, 38.0, 41.0, 42.0, 41.0, 44.0, 31.0, 28.0, 26.0, 34.0, 29.0, 31.0, 28.0, 19.0, 26.0, 20.0, 17.0, 21.0, 10.0, 5.0, 9.0, 5.0, 8.0, 5.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.054158806800842285, -0.05260934308171272, -0.05105987936258316, -0.0495104156434536, -0.047960951924324036, -0.04641148820519447, -0.04486202448606491, -0.04331256076693535, -0.041763097047805786, -0.040213633328676224, -0.03866416960954666, -0.0371147058904171, -0.03556524217128754, -0.034015778452157974, -0.03246631473302841, -0.03091685101389885, -0.029367387294769287, -0.027817923575639725, -0.026268459856510162, -0.0247189961373806, -0.023169532418251038, -0.021620068699121475, -0.020070604979991913, -0.01852114126086235, -0.016971677541732788, -0.015422213822603226, -0.013872750103473663, -0.012323286384344101, -0.010773822665214539, -0.009224358946084976, -0.007674895226955414, -0.0061254315078258514, -0.004575967788696289, -0.0030265040695667267, -0.0014770403504371643, 7.242336869239807e-05, 0.0016218870878219604, 0.003171350806951523, 0.004720814526081085, 0.006270278245210648, 0.00781974196434021, 0.009369205683469772, 0.010918669402599335, 0.012468133121728897, 0.01401759684085846, 0.015567060559988022, 0.017116524279117584, 0.018665987998247147, 0.02021545171737671, 0.02176491543650627, 0.023314379155635834, 0.024863842874765396, 0.02641330659389496, 0.02796277031302452, 0.029512234032154083, 0.031061697751283646, 0.03261116147041321, 0.03416062518954277, 0.03571008890867233, 0.037259552627801895, 0.03880901634693146, 0.04035848006606102, 0.04190794378519058, 0.043457407504320145, 0.04500687122344971]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 8.0, 5.0, 9.0, 2.0, 12.0, 10.0, 13.0, 16.0, 31.0, 23.0, 31.0, 43.0, 29.0, 35.0, 32.0, 52.0, 64.0, 53.0, 52.0, 48.0, 56.0, 54.0, 37.0, 45.0, 40.0, 29.0, 35.0, 20.0, 31.0, 21.0, 10.0, 12.0, 11.0, 12.0, 7.0, 7.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-310.0, -299.90234375, -289.8046875, -279.70703125, -269.609375, -259.51171875, -249.4140625, -239.31640625, -229.21875, -219.12109375, -209.0234375, -198.92578125, -188.828125, -178.73046875, -168.6328125, -158.53515625, -148.4375, -138.33984375, -128.2421875, -118.14453125, -108.046875, -97.94921875, -87.8515625, -77.75390625, -67.65625, -57.55859375, -47.4609375, -37.36328125, -27.265625, -17.16796875, -7.0703125, 3.02734375, 13.125, 23.22265625, 33.3203125, 43.41796875, 53.515625, 63.61328125, 73.7109375, 83.80859375, 93.90625, 104.00390625, 114.1015625, 124.19921875, 134.296875, 144.39453125, 154.4921875, 164.58984375, 174.6875, 184.78515625, 194.8828125, 204.98046875, 215.078125, 225.17578125, 235.2734375, 245.37109375, 255.46875, 265.56640625, 275.6640625, 285.76171875, 295.859375, 305.95703125, 316.0546875, 326.15234375, 336.25]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 6.0, 6.0, 9.0, 9.0, 18.0, 30.0, 26.0, 60.0, 68.0, 115.0, 204.0, 403.0, 673.0, 1309.0, 3096.0, 8711.0, 37374.0, 290845.0, 620032.0, 64836.0, 13103.0, 3921.0, 1730.0, 827.0, 453.0, 274.0, 137.0, 77.0, 65.0, 40.0, 30.0, 16.0, 14.0, 16.0, 7.0, 7.0, 3.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.6875, -84.873046875, -82.05859375, -79.244140625, -76.4296875, -73.615234375, -70.80078125, -67.986328125, -65.171875, -62.357421875, -59.54296875, -56.728515625, -53.9140625, -51.099609375, -48.28515625, -45.470703125, -42.65625, -39.841796875, -37.02734375, -34.212890625, -31.3984375, -28.583984375, -25.76953125, -22.955078125, -20.140625, -17.326171875, -14.51171875, -11.697265625, -8.8828125, -6.068359375, -3.25390625, -0.439453125, 2.375, 5.189453125, 8.00390625, 10.818359375, 13.6328125, 16.447265625, 19.26171875, 22.076171875, 24.890625, 27.705078125, 30.51953125, 33.333984375, 36.1484375, 38.962890625, 41.77734375, 44.591796875, 47.40625, 50.220703125, 53.03515625, 55.849609375, 58.6640625, 61.478515625, 64.29296875, 67.107421875, 69.921875, 72.736328125, 75.55078125, 78.365234375, 81.1796875, 83.994140625, 86.80859375, 89.623046875, 92.4375]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 11.0, 12.0, 30.0, 34.0, 50.0, 65.0, 79.0, 92.0, 195.0, 2075.0, 91.0, 83.0, 69.0, 48.0, 40.0, 31.0, 17.0, 7.0, 9.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-732.5, -711.015625, -689.53125, -668.046875, -646.5625, -625.078125, -603.59375, -582.109375, -560.625, -539.140625, -517.65625, -496.171875, -474.6875, -453.203125, -431.71875, -410.234375, -388.75, -367.265625, -345.78125, -324.296875, -302.8125, -281.328125, -259.84375, -238.359375, -216.875, -195.390625, -173.90625, -152.421875, -130.9375, -109.453125, -87.96875, -66.484375, -45.0, -23.515625, -2.03125, 19.453125, 40.9375, 62.421875, 83.90625, 105.390625, 126.875, 148.359375, 169.84375, 191.328125, 212.8125, 234.296875, 255.78125, 277.265625, 298.75, 320.234375, 341.71875, 363.203125, 384.6875, 406.171875, 427.65625, 449.140625, 470.625, 492.109375, 513.59375, 535.078125, 556.5625, 578.046875, 599.53125, 621.015625, 642.5]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 15.0, 12.0, 9.0, 22.0, 36.0, 63.0, 97.0, 168.0, 249.0, 524.0, 1199.0, 3745.0, 37280.0, 2989648.0, 103255.0, 6334.0, 1628.0, 648.0, 302.0, 172.0, 106.0, 76.0, 30.0, 28.0, 16.0, 15.0, 4.0, 4.0, 6.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.875, -114.865234375, -110.85546875, -106.845703125, -102.8359375, -98.826171875, -94.81640625, -90.806640625, -86.796875, -82.787109375, -78.77734375, -74.767578125, -70.7578125, -66.748046875, -62.73828125, -58.728515625, -54.71875, -50.708984375, -46.69921875, -42.689453125, -38.6796875, -34.669921875, -30.66015625, -26.650390625, -22.640625, -18.630859375, -14.62109375, -10.611328125, -6.6015625, -2.591796875, 1.41796875, 5.427734375, 9.4375, 13.447265625, 17.45703125, 21.466796875, 25.4765625, 29.486328125, 33.49609375, 37.505859375, 41.515625, 45.525390625, 49.53515625, 53.544921875, 57.5546875, 61.564453125, 65.57421875, 69.583984375, 73.59375, 77.603515625, 81.61328125, 85.623046875, 89.6328125, 93.642578125, 97.65234375, 101.662109375, 105.671875, 109.681640625, 113.69140625, 117.701171875, 121.7109375, 125.720703125, 129.73046875, 133.740234375, 137.75]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 3.0, 12.0, 25.0, 60.0, 163.0, 331.0, 230.0, 102.0, 39.0, 18.0, 6.0, 8.0, 7.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-405.2336730957031, -370.47528076171875, -335.7169189453125, -300.9585266113281, -266.20013427734375, -231.44174194335938, -196.68336486816406, -161.92498779296875, -127.16659545898438, -92.40821075439453, -57.64982604980469, -22.891441345214844, 11.866943359375, 46.625335693359375, 81.38371276855469, 116.14208984375, 150.90048217773438, 185.65887451171875, 220.41725158691406, 255.17562866210938, 289.93402099609375, 324.6924133300781, 359.4508056640625, 394.20916748046875, 428.9675598144531, 463.7259521484375, 498.48431396484375, 533.2427368164062, 568.0010986328125, 602.759521484375, 637.5178833007812, 672.2762451171875, 707.0345458984375, 741.7929077148438, 776.5513305664062, 811.3096923828125, 846.068115234375, 880.8264770507812, 915.5848388671875, 950.34326171875, 985.1016235351562, 1019.8599853515625, 1054.618408203125, 1089.3768310546875, 1124.1351318359375, 1158.8935546875, 1193.6519775390625, 1228.4102783203125, 1263.168701171875, 1297.9271240234375, 1332.6854248046875, 1367.44384765625, 1402.2022705078125, 1436.960693359375, 1471.718994140625, 1506.4774169921875, 1541.23583984375, 1575.9942626953125, 1610.7525634765625, 1645.510986328125, 1680.2694091796875, 1715.02783203125, 1749.7861328125, 1784.5445556640625, 1819.3028564453125]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 5.0, 4.0, 8.0, 6.0, 6.0, 9.0, 13.0, 15.0, 15.0, 14.0, 18.0, 25.0, 24.0, 20.0, 32.0, 34.0, 32.0, 30.0, 43.0, 39.0, 42.0, 42.0, 44.0, 41.0, 47.0, 36.0, 42.0, 26.0, 34.0, 35.0, 33.0, 30.0, 23.0, 28.0, 17.0, 15.0, 15.0, 21.0, 12.0, 1.0, 7.0, 9.0, 4.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-398.3939208984375, -385.4479675292969, -372.5019836425781, -359.5560302734375, -346.6100769042969, -333.66412353515625, -320.7181396484375, -307.7721862792969, -294.82623291015625, -281.8802795410156, -268.9342956542969, -255.98834228515625, -243.04238891601562, -230.09642028808594, -217.15045166015625, -204.20449829101562, -191.25851440429688, -178.3125457763672, -165.36659240722656, -152.42062377929688, -139.47467041015625, -126.52870178222656, -113.58273315429688, -100.63677215576172, -87.69081115722656, -74.7448501586914, -61.798885345458984, -48.85292053222656, -35.906959533691406, -22.96099853515625, -10.015029907226562, 2.9309310913085938, 15.87689208984375, 28.82285499572754, 41.76881790161133, 54.71478271484375, 67.6607437133789, 80.60670471191406, 93.55267333984375, 106.4986343383789, 119.44459533691406, 132.39056396484375, 145.33651733398438, 158.28248596191406, 171.22845458984375, 184.17440795898438, 197.12037658691406, 210.06634521484375, 223.01229858398438, 235.95826721191406, 248.9042205810547, 261.8501892089844, 274.796142578125, 287.74212646484375, 300.6880798339844, 313.634033203125, 326.58001708984375, 339.5259704589844, 352.4719543457031, 365.41790771484375, 378.3638610839844, 391.309814453125, 404.25579833984375, 417.2017517089844, 430.147705078125]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 3.0, 6.0, 1.0, 1.0, 4.0, 1.0, 6.0, 9.0, 11.0, 15.0, 19.0, 23.0, 20.0, 26.0, 27.0, 43.0, 78.0, 103.0, 172.0, 240.0, 367.0, 493.0, 1062.0, 1043310.0, 930.0, 487.0, 340.0, 232.0, 164.0, 99.0, 53.0, 48.0, 33.0, 24.0, 27.0, 15.0, 11.0, 15.0, 6.0, 11.0, 6.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-217.81832885742188, -209.8820343017578, -201.94573974609375, -194.00946044921875, -186.0731658935547, -178.13687133789062, -170.20057678222656, -162.2642822265625, -154.3280029296875, -146.39170837402344, -138.45541381835938, -130.51913452148438, -122.58283996582031, -114.64654541015625, -106.71025085449219, -98.77395629882812, -90.83766174316406, -82.9013671875, -74.96508026123047, -67.0287857055664, -59.09249496459961, -51.15620422363281, -43.21990966796875, -35.28361892700195, -27.347328186035156, -19.41103744506836, -11.47474479675293, -3.5384521484375, 4.397838592529297, 12.334129333496094, 20.270423889160156, 28.206714630126953, 36.14300537109375, 44.07929611206055, 52.015586853027344, 59.951881408691406, 67.88816833496094, 75.824462890625, 83.76075744628906, 91.69705200195312, 99.63333892822266, 107.56963348388672, 115.50592041015625, 123.44221496582031, 131.37850952148438, 139.31478881835938, 147.2510986328125, 155.1873779296875, 163.12367248535156, 171.05996704101562, 178.9962615966797, 186.93255615234375, 194.86883544921875, 202.8051300048828, 210.74142456054688, 218.67771911621094, 226.614013671875, 234.55030822753906, 242.48660278320312, 250.42288208007812, 258.35919189453125, 266.29547119140625, 274.23175048828125, 282.1680603027344, 290.1043395996094]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 2.0, 2.0, 7.0, 8.0, 5.0, 5.0, 4.0, 9.0, 7.0, 7.0, 11.0, 16.0, 30.0, 57.0, 330.0, 51457168.0, 5207.0, 134.0, 53.0, 34.0, 15.0, 9.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 6.0, 3.0, 0.0, 6.0, 1.0, 2.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2042.0, -1933.6817626953125, -1825.3634033203125, -1717.045166015625, -1608.726806640625, -1500.4085693359375, -1392.09033203125, -1283.77197265625, -1175.45361328125, -1067.1353759765625, -958.8170166015625, -850.498779296875, -742.180419921875, -633.8621826171875, -525.5438842773438, -417.2255859375, -308.9073486328125, -200.58905029296875, -92.27076721191406, 16.047515869140625, 124.36581420898438, 232.68408203125, 341.00238037109375, 449.3206787109375, 557.6389770507812, 665.957275390625, 774.2755737304688, 882.5938720703125, 990.912109375, 1099.23046875, 1207.5487060546875, 1315.866943359375, 1424.185302734375, 1532.5035400390625, 1640.8218994140625, 1749.14013671875, 1857.45849609375, 1965.7767333984375, 2074.094970703125, 2182.413330078125, 2290.731689453125, 2399.050048828125, 2507.3681640625, 2615.6865234375, 2724.0048828125, 2832.3232421875, 2940.641357421875, 3048.959716796875, 3157.27783203125, 3265.59619140625, 3373.914306640625, 3482.232666015625, 3590.551025390625, 3698.869140625, 3807.1875, 3915.505859375, 4023.82421875, 4132.142578125, 4240.4609375, 4348.779296875, 4457.09716796875, 4565.41552734375, 4673.73388671875, 4782.05224609375, 4890.37060546875]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 7.0, 6.0, 18.0, 17.0, 23.0, 36.0, 42.0, 74.0, 108.0, 140.0, 248.0, 362.0, 558.0, 999.0, 1568.0, 2593.0, 4209.0, 7293.0, 12648.0, 22206.0, 40616.0, 72942.0, 139600.0, 290390.0, 767372.0, 4102404.0, 419257.0, 189191.0, 96440.0, 51837.0, 28946.0, 16350.0, 9172.0, 5461.0, 3036.0, 1938.0, 1239.0, 739.0, 515.0, 299.0, 180.0, 122.0, 74.0, 58.0, 32.0, 13.0, 17.0, 13.0, 12.0, 5.0, 6.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0], "bins": [-12.3515625, -11.9559326171875, -11.560302734375, -11.1646728515625, -10.76904296875, -10.3734130859375, -9.977783203125, -9.5821533203125, -9.1865234375, -8.7908935546875, -8.395263671875, -7.9996337890625, -7.60400390625, -7.2083740234375, -6.812744140625, -6.4171142578125, -6.021484375, -5.6258544921875, -5.230224609375, -4.8345947265625, -4.43896484375, -4.0433349609375, -3.647705078125, -3.2520751953125, -2.8564453125, -2.4608154296875, -2.065185546875, -1.6695556640625, -1.27392578125, -0.8782958984375, -0.482666015625, -0.0870361328125, 0.30859375, 0.7042236328125, 1.099853515625, 1.4954833984375, 1.89111328125, 2.2867431640625, 2.682373046875, 3.0780029296875, 3.4736328125, 3.8692626953125, 4.264892578125, 4.6605224609375, 5.05615234375, 5.4517822265625, 5.847412109375, 6.2430419921875, 6.638671875, 7.0343017578125, 7.429931640625, 7.8255615234375, 8.22119140625, 8.6168212890625, 9.012451171875, 9.4080810546875, 9.8037109375, 10.1993408203125, 10.594970703125, 10.9906005859375, 11.38623046875, 11.7818603515625, 12.177490234375, 12.5731201171875, 12.96875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 9.0, 5.0, 8.0, 9.0, 11.0, 20.0, 22.0, 24.0, 29.0, 45.0, 35.0, 39.0, 42.0, 32.0, 56.0, 54.0, 205.0, 911.0, 63.0, 51.0, 35.0, 50.0, 39.0, 42.0, 29.0, 36.0, 24.0, 22.0, 21.0, 16.0, 13.0, 6.0, 5.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.75, -71.5947265625, -69.439453125, -67.2841796875, -65.12890625, -62.9736328125, -60.818359375, -58.6630859375, -56.5078125, -54.3525390625, -52.197265625, -50.0419921875, -47.88671875, -45.7314453125, -43.576171875, -41.4208984375, -39.265625, -37.1103515625, -34.955078125, -32.7998046875, -30.64453125, -28.4892578125, -26.333984375, -24.1787109375, -22.0234375, -19.8681640625, -17.712890625, -15.5576171875, -13.40234375, -11.2470703125, -9.091796875, -6.9365234375, -4.78125, -2.6259765625, -0.470703125, 1.6845703125, 3.83984375, 5.9951171875, 8.150390625, 10.3056640625, 12.4609375, 14.6162109375, 16.771484375, 18.9267578125, 21.08203125, 23.2373046875, 25.392578125, 27.5478515625, 29.703125, 31.8583984375, 34.013671875, 36.1689453125, 38.32421875, 40.4794921875, 42.634765625, 44.7900390625, 46.9453125, 49.1005859375, 51.255859375, 53.4111328125, 55.56640625, 57.7216796875, 59.876953125, 62.0322265625, 64.1875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 9.0, 9.0, 13.0, 20.0, 19.0, 27.0, 43.0, 56.0, 99.0, 144.0, 171.0, 265.0, 384.0, 590.0, 889.0, 1249.0, 1826.0, 2819.0, 4279.0, 6395.0, 9985.0, 15882.0, 25960.0, 42648.0, 71601.0, 123215.0, 225347.0, 452834.0, 3808540.0, 772731.0, 316514.0, 167071.0, 94447.0, 55046.0, 33295.0, 20360.0, 12765.0, 8120.0, 5335.0, 3441.0, 2223.0, 1488.0, 1016.0, 684.0, 476.0, 362.0, 248.0, 171.0, 115.0, 80.0, 48.0, 38.0, 22.0, 13.0, 13.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-10.234375, -9.912109375, -9.58984375, -9.267578125, -8.9453125, -8.623046875, -8.30078125, -7.978515625, -7.65625, -7.333984375, -7.01171875, -6.689453125, -6.3671875, -6.044921875, -5.72265625, -5.400390625, -5.078125, -4.755859375, -4.43359375, -4.111328125, -3.7890625, -3.466796875, -3.14453125, -2.822265625, -2.5, -2.177734375, -1.85546875, -1.533203125, -1.2109375, -0.888671875, -0.56640625, -0.244140625, 0.078125, 0.400390625, 0.72265625, 1.044921875, 1.3671875, 1.689453125, 2.01171875, 2.333984375, 2.65625, 2.978515625, 3.30078125, 3.623046875, 3.9453125, 4.267578125, 4.58984375, 4.912109375, 5.234375, 5.556640625, 5.87890625, 6.201171875, 6.5234375, 6.845703125, 7.16796875, 7.490234375, 7.8125, 8.134765625, 8.45703125, 8.779296875, 9.1015625, 9.423828125, 9.74609375, 10.068359375, 10.390625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 6.0, 9.0, 9.0, 12.0, 12.0, 17.0, 18.0, 23.0, 27.0, 22.0, 38.0, 26.0, 30.0, 37.0, 39.0, 49.0, 44.0, 145.0, 879.0, 111.0, 60.0, 40.0, 45.0, 39.0, 43.0, 32.0, 28.0, 28.0, 15.0, 17.0, 23.0, 15.0, 13.0, 19.0, 7.0, 7.0, 12.0, 4.0, 9.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-42.03125, -40.73388671875, -39.4365234375, -38.13916015625, -36.841796875, -35.54443359375, -34.2470703125, -32.94970703125, -31.65234375, -30.35498046875, -29.0576171875, -27.76025390625, -26.462890625, -25.16552734375, -23.8681640625, -22.57080078125, -21.2734375, -19.97607421875, -18.6787109375, -17.38134765625, -16.083984375, -14.78662109375, -13.4892578125, -12.19189453125, -10.89453125, -9.59716796875, -8.2998046875, -7.00244140625, -5.705078125, -4.40771484375, -3.1103515625, -1.81298828125, -0.515625, 0.78173828125, 2.0791015625, 3.37646484375, 4.673828125, 5.97119140625, 7.2685546875, 8.56591796875, 9.86328125, 11.16064453125, 12.4580078125, 13.75537109375, 15.052734375, 16.35009765625, 17.6474609375, 18.94482421875, 20.2421875, 21.53955078125, 22.8369140625, 24.13427734375, 25.431640625, 26.72900390625, 28.0263671875, 29.32373046875, 30.62109375, 31.91845703125, 33.2158203125, 34.51318359375, 35.810546875, 37.10791015625, 38.4052734375, 39.70263671875, 41.0]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 10.0, 17.0, 29.0, 34.0, 56.0, 78.0, 95.0, 159.0, 204.0, 285.0, 347.0, 502.0, 665.0, 986.0, 1251.0, 1753.0, 2535.0, 3717.0, 5374.0, 7911.0, 11953.0, 19183.0, 32719.0, 62821.0, 170300.0, 5690245.0, 138956.0, 55929.0, 29859.0, 17584.0, 11259.0, 7571.0, 4891.0, 3514.0, 2383.0, 1702.0, 1261.0, 873.0, 648.0, 495.0, 350.0, 295.0, 201.0, 126.0, 105.0, 74.0, 36.0, 32.0, 23.0, 9.0, 9.0, 3.0, 5.0, 4.0, 7.0, 6.0, 3.0], "bins": [-18.59375, -18.020263671875, -17.44677734375, -16.873291015625, -16.2998046875, -15.726318359375, -15.15283203125, -14.579345703125, -14.005859375, -13.432373046875, -12.85888671875, -12.285400390625, -11.7119140625, -11.138427734375, -10.56494140625, -9.991455078125, -9.41796875, -8.844482421875, -8.27099609375, -7.697509765625, -7.1240234375, -6.550537109375, -5.97705078125, -5.403564453125, -4.830078125, -4.256591796875, -3.68310546875, -3.109619140625, -2.5361328125, -1.962646484375, -1.38916015625, -0.815673828125, -0.2421875, 0.331298828125, 0.90478515625, 1.478271484375, 2.0517578125, 2.625244140625, 3.19873046875, 3.772216796875, 4.345703125, 4.919189453125, 5.49267578125, 6.066162109375, 6.6396484375, 7.213134765625, 7.78662109375, 8.360107421875, 8.93359375, 9.507080078125, 10.08056640625, 10.654052734375, 11.2275390625, 11.801025390625, 12.37451171875, 12.947998046875, 13.521484375, 14.094970703125, 14.66845703125, 15.241943359375, 15.8154296875, 16.388916015625, 16.96240234375, 17.535888671875, 18.109375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 6.0, 6.0, 7.0, 13.0, 8.0, 12.0, 16.0, 16.0, 13.0, 15.0, 26.0, 20.0, 33.0, 29.0, 25.0, 31.0, 33.0, 28.0, 43.0, 38.0, 85.0, 559.0, 421.0, 97.0, 46.0, 35.0, 39.0, 35.0, 30.0, 25.0, 31.0, 28.0, 24.0, 26.0, 24.0, 23.0, 2.0, 14.0, 14.0, 9.0, 8.0, 10.0, 7.0, 2.0, 6.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-25.53125, -24.704833984375, -23.87841796875, -23.052001953125, -22.2255859375, -21.399169921875, -20.57275390625, -19.746337890625, -18.919921875, -18.093505859375, -17.26708984375, -16.440673828125, -15.6142578125, -14.787841796875, -13.96142578125, -13.135009765625, -12.30859375, -11.482177734375, -10.65576171875, -9.829345703125, -9.0029296875, -8.176513671875, -7.35009765625, -6.523681640625, -5.697265625, -4.870849609375, -4.04443359375, -3.218017578125, -2.3916015625, -1.565185546875, -0.73876953125, 0.087646484375, 0.9140625, 1.740478515625, 2.56689453125, 3.393310546875, 4.2197265625, 5.046142578125, 5.87255859375, 6.698974609375, 7.525390625, 8.351806640625, 9.17822265625, 10.004638671875, 10.8310546875, 11.657470703125, 12.48388671875, 13.310302734375, 14.13671875, 14.963134765625, 15.78955078125, 16.615966796875, 17.4423828125, 18.268798828125, 19.09521484375, 19.921630859375, 20.748046875, 21.574462890625, 22.40087890625, 23.227294921875, 24.0537109375, 24.880126953125, 25.70654296875, 26.532958984375, 27.359375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 7.0, 2.0, 7.0, 14.0, 19.0, 33.0, 73.0, 145.0, 259.0, 220.0, 98.0, 54.0, 27.0, 18.0, 9.0, 13.0, 6.0, 3.0, 3.0, 1.0, 1.0, 3.0], "bins": [-155.717529296875, -152.6497039794922, -149.58187866210938, -146.51405334472656, -143.44622802734375, -140.37841796875, -137.31057739257812, -134.24276733398438, -131.17494201660156, -128.10711669921875, -125.03929138183594, -121.97146606445312, -118.90364837646484, -115.83582305908203, -112.76799774169922, -109.7001724243164, -106.6323471069336, -103.56452178955078, -100.49669647216797, -97.42887878417969, -94.36105346679688, -91.29322814941406, -88.22540283203125, -85.15757751464844, -82.08975219726562, -79.02192687988281, -75.9541015625, -72.88627624511719, -69.8184585571289, -66.7506332397461, -63.68280792236328, -60.61498260498047, -57.54717254638672, -54.479347229003906, -51.41152572631836, -48.34370040893555, -45.27587890625, -42.20805358886719, -39.140228271484375, -36.07240295410156, -33.004581451416016, -29.936758041381836, -26.868934631347656, -23.801109313964844, -20.733285903930664, -17.665462493896484, -14.597637176513672, -11.529813766479492, -8.461990356445312, -5.394166469573975, -2.3263425827026367, 0.7414817810058594, 3.809305191040039, 6.877128601074219, 9.944953918457031, 13.012777328491211, 16.08060073852539, 19.14842414855957, 22.21624755859375, 25.284072875976562, 28.351896286010742, 31.419719696044922, 34.487545013427734, 37.55536651611328, 40.623191833496094]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 5.0, 4.0, 2.0, 16.0, 13.0, 10.0, 16.0, 27.0, 18.0, 18.0, 31.0, 40.0, 34.0, 48.0, 43.0, 49.0, 45.0, 47.0, 43.0, 46.0, 53.0, 43.0, 46.0, 33.0, 40.0, 40.0, 26.0, 30.0, 21.0, 17.0, 26.0, 11.0, 13.0, 12.0, 13.0, 9.0, 4.0, 5.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.001197814941406, -38.545654296875, -37.090110778808594, -35.63456726074219, -34.17902374267578, -32.723480224609375, -31.267934799194336, -29.81239128112793, -28.356847763061523, -26.901304244995117, -25.44576072692871, -23.990215301513672, -22.534671783447266, -21.07912826538086, -19.623584747314453, -18.168041229248047, -16.71249771118164, -15.256954193115234, -13.801410675048828, -12.345866203308105, -10.8903226852417, -9.434779167175293, -7.97923469543457, -6.523691177368164, -5.068147659301758, -3.6126039028167725, -2.157060146331787, -0.7015161514282227, 0.7540273666381836, 2.20957088470459, 3.6651153564453125, 5.120658874511719, 6.576202392578125, 8.031745910644531, 9.487289428710938, 10.94283390045166, 12.398377418518066, 13.853920936584473, 15.309465408325195, 16.7650089263916, 18.220552444458008, 19.676095962524414, 21.13163948059082, 22.58718490600586, 24.042728424072266, 25.498271942138672, 26.953815460205078, 28.409358978271484, 29.86490249633789, 31.320446014404297, 32.7759895324707, 34.23153305053711, 35.687076568603516, 37.14262008666992, 38.598167419433594, 40.0537109375, 41.509254455566406, 42.96479797363281, 44.42034149169922, 45.875885009765625, 47.33142852783203, 48.78697204589844, 50.242515563964844, 51.69805908203125, 53.153602600097656]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 2.0, 11.0, 11.0, 19.0, 27.0, 42.0, 58.0, 87.0, 134.0, 174.0, 314.0, 438.0, 755.0, 1106.0, 1861.0, 3538.0, 7674.0, 21563.0, 573098.0, 3535171.0, 25993.0, 9891.0, 4750.0, 2681.0, 1622.0, 1030.0, 708.0, 445.0, 297.0, 200.0, 148.0, 89.0, 89.0, 62.0, 38.0, 51.0, 24.0, 22.0, 19.0, 11.0, 6.0, 3.0, 6.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8544921875, -1.7804107666015625, -1.706329345703125, -1.6322479248046875, -1.55816650390625, -1.4840850830078125, -1.410003662109375, -1.3359222412109375, -1.2618408203125, -1.1877593994140625, -1.113677978515625, -1.0395965576171875, -0.96551513671875, -0.8914337158203125, -0.817352294921875, -0.7432708740234375, -0.669189453125, -0.5951080322265625, -0.521026611328125, -0.4469451904296875, -0.37286376953125, -0.2987823486328125, -0.224700927734375, -0.1506195068359375, -0.0765380859375, -0.0024566650390625, 0.071624755859375, 0.1457061767578125, 0.21978759765625, 0.2938690185546875, 0.367950439453125, 0.4420318603515625, 0.51611328125, 0.5901947021484375, 0.664276123046875, 0.7383575439453125, 0.81243896484375, 0.8865203857421875, 0.960601806640625, 1.0346832275390625, 1.1087646484375, 1.1828460693359375, 1.256927490234375, 1.3310089111328125, 1.40509033203125, 1.4791717529296875, 1.553253173828125, 1.6273345947265625, 1.701416015625, 1.7754974365234375, 1.849578857421875, 1.9236602783203125, 1.99774169921875, 2.0718231201171875, 2.145904541015625, 2.2199859619140625, 2.2940673828125, 2.3681488037109375, 2.442230224609375, 2.5163116455078125, 2.59039306640625, 2.6644744873046875, 2.738555908203125, 2.8126373291015625, 2.88671875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 6.0, 7.0, 12.0, 19.0, 18.0, 15.0, 363.0, 434.0, 21.0, 12.0, 13.0, 11.0, 6.0, 13.0, 4.0, 3.0, 5.0, 0.0, 4.0, 5.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.303466796875, -0.2914314270019531, -0.27939605712890625, -0.2673606872558594, -0.2553253173828125, -0.24328994750976562, -0.23125457763671875, -0.21921920776367188, -0.207183837890625, -0.19514846801757812, -0.18311309814453125, -0.17107772827148438, -0.1590423583984375, -0.14700698852539062, -0.13497161865234375, -0.12293624877929688, -0.11090087890625, -0.09886550903320312, -0.08683013916015625, -0.07479476928710938, -0.0627593994140625, -0.050724029541015625, -0.03868865966796875, -0.026653289794921875, -0.014617919921875, -0.002582550048828125, 0.00945281982421875, 0.021488189697265625, 0.0335235595703125, 0.045558929443359375, 0.05759429931640625, 0.06962966918945312, 0.0816650390625, 0.09370040893554688, 0.10573577880859375, 0.11777114868164062, 0.1298065185546875, 0.14184188842773438, 0.15387725830078125, 0.16591262817382812, 0.177947998046875, 0.18998336791992188, 0.20201873779296875, 0.21405410766601562, 0.2260894775390625, 0.23812484741210938, 0.25016021728515625, 0.2621955871582031, 0.27423095703125, 0.2862663269042969, 0.29830169677734375, 0.3103370666503906, 0.3223724365234375, 0.3344078063964844, 0.34644317626953125, 0.3584785461425781, 0.370513916015625, 0.3825492858886719, 0.39458465576171875, 0.4066200256347656, 0.4186553955078125, 0.4306907653808594, 0.44272613525390625, 0.4547615051269531, 0.466796875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 9.0, 2.0, 9.0, 5.0, 6.0, 17.0, 26.0, 30.0, 48.0, 75.0, 91.0, 169.0, 220.0, 314.0, 532.0, 779.0, 1248.0, 1943.0, 3145.0, 5297.0, 8956.0, 15771.0, 29099.0, 60383.0, 161953.0, 2438483.0, 1202324.0, 141478.0, 56460.0, 27471.0, 15175.0, 8682.0, 5255.0, 3170.0, 2034.0, 1207.0, 820.0, 530.0, 369.0, 213.0, 157.0, 114.0, 63.0, 48.0, 39.0, 27.0, 11.0, 11.0, 8.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0], "bins": [-1.373046875, -1.3325958251953125, -1.292144775390625, -1.2516937255859375, -1.21124267578125, -1.1707916259765625, -1.130340576171875, -1.0898895263671875, -1.0494384765625, -1.0089874267578125, -0.968536376953125, -0.9280853271484375, -0.88763427734375, -0.8471832275390625, -0.806732177734375, -0.7662811279296875, -0.725830078125, -0.6853790283203125, -0.644927978515625, -0.6044769287109375, -0.56402587890625, -0.5235748291015625, -0.483123779296875, -0.4426727294921875, -0.4022216796875, -0.3617706298828125, -0.321319580078125, -0.2808685302734375, -0.24041748046875, -0.1999664306640625, -0.159515380859375, -0.1190643310546875, -0.07861328125, -0.0381622314453125, 0.002288818359375, 0.0427398681640625, 0.08319091796875, 0.1236419677734375, 0.164093017578125, 0.2045440673828125, 0.2449951171875, 0.2854461669921875, 0.325897216796875, 0.3663482666015625, 0.40679931640625, 0.4472503662109375, 0.487701416015625, 0.5281524658203125, 0.568603515625, 0.6090545654296875, 0.649505615234375, 0.6899566650390625, 0.73040771484375, 0.7708587646484375, 0.811309814453125, 0.8517608642578125, 0.8922119140625, 0.9326629638671875, 0.973114013671875, 1.0135650634765625, 1.05401611328125, 1.0944671630859375, 1.134918212890625, 1.1753692626953125, 1.2158203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 7.0, 4.0, 8.0, 7.0, 6.0, 19.0, 19.0, 25.0, 31.0, 45.0, 53.0, 53.0, 85.0, 141.0, 256.0, 1370.0, 1167.0, 250.0, 127.0, 89.0, 62.0, 39.0, 47.0, 29.0, 31.0, 21.0, 19.0, 13.0, 11.0, 4.0, 12.0, 9.0, 3.0, 5.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.66845703125, -0.6493377685546875, -0.630218505859375, -0.6110992431640625, -0.59197998046875, -0.5728607177734375, -0.553741455078125, -0.5346221923828125, -0.5155029296875, -0.4963836669921875, -0.477264404296875, -0.4581451416015625, -0.43902587890625, -0.4199066162109375, -0.400787353515625, -0.3816680908203125, -0.362548828125, -0.3434295654296875, -0.324310302734375, -0.3051910400390625, -0.28607177734375, -0.2669525146484375, -0.247833251953125, -0.2287139892578125, -0.2095947265625, -0.1904754638671875, -0.171356201171875, -0.1522369384765625, -0.13311767578125, -0.1139984130859375, -0.094879150390625, -0.0757598876953125, -0.056640625, -0.0375213623046875, -0.018402099609375, 0.0007171630859375, 0.01983642578125, 0.0389556884765625, 0.058074951171875, 0.0771942138671875, 0.0963134765625, 0.1154327392578125, 0.134552001953125, 0.1536712646484375, 0.17279052734375, 0.1919097900390625, 0.211029052734375, 0.2301483154296875, 0.249267578125, 0.2683868408203125, 0.287506103515625, 0.3066253662109375, 0.32574462890625, 0.3448638916015625, 0.363983154296875, 0.3831024169921875, 0.4022216796875, 0.4213409423828125, 0.440460205078125, 0.4595794677734375, 0.47869873046875, 0.4978179931640625, 0.516937255859375, 0.5360565185546875, 0.55517578125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 3.0, 11.0, 8.0, 15.0, 17.0, 17.0, 31.0, 45.0, 62.0, 92.0, 127.0, 153.0, 127.0, 81.0, 58.0, 48.0, 28.0, 21.0, 16.0, 9.0, 10.0, 10.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.653794050216675, -2.568696975708008, -2.483599901199341, -2.398502826690674, -2.313405752182007, -2.22830867767334, -2.1432113647460938, -2.058114528656006, -1.9730173349380493, -1.8879202604293823, -1.8028231859207153, -1.7177259922027588, -1.6326289176940918, -1.5475318431854248, -1.4624347686767578, -1.3773376941680908, -1.2922406196594238, -1.2071435451507568, -1.1220464706420898, -1.0369493961334229, -0.9518522620201111, -0.8667551875114441, -0.7816580533981323, -0.6965609788894653, -0.6114639043807983, -0.5263668298721313, -0.44126972556114197, -0.3561726212501526, -0.2710755467414856, -0.1859784722328186, -0.10088133811950684, -0.015784263610839844, 0.06931257247924805, 0.15440966188907623, 0.23950675129890442, 0.3246038556098938, 0.4097009301185608, 0.4947980046272278, 0.5798951387405396, 0.6649922132492065, 0.7500892877578735, 0.8351863622665405, 0.9202834367752075, 1.005380630493164, 1.090477705001831, 1.175574779510498, 1.260671854019165, 1.345768928527832, 1.430866003036499, 1.515963077545166, 1.601060152053833, 1.6861572265625, 1.771254301071167, 1.856351375579834, 1.9414485692977905, 2.026545524597168, 2.111642837524414, 2.196739912033081, 2.281836986541748, 2.366934061050415, 2.452031135559082, 2.537128210067749, 2.622225284576416, 2.707322597503662, 2.79241943359375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 3.0, 4.0, 5.0, 7.0, 8.0, 16.0, 14.0, 18.0, 27.0, 28.0, 37.0, 40.0, 47.0, 44.0, 60.0, 62.0, 59.0, 65.0, 52.0, 53.0, 46.0, 60.0, 45.0, 32.0, 44.0, 23.0, 20.0, 16.0, 14.0, 11.0, 7.0, 5.0, 10.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.0711510181427, -2.000272035598755, -1.9293930530548096, -1.8585140705108643, -1.787635087966919, -1.7167561054229736, -1.6458772420883179, -1.5749982595443726, -1.5041192770004272, -1.433240294456482, -1.3623613119125366, -1.2914823293685913, -1.2206034660339355, -1.1497244834899902, -1.078845500946045, -1.0079665184020996, -0.9370875358581543, -0.866208553314209, -0.7953295707702637, -0.7244506478309631, -0.6535716652870178, -0.5826926827430725, -0.511813759803772, -0.44093477725982666, -0.37005579471588135, -0.29917681217193604, -0.2282978594303131, -0.157418891787529, -0.08653992414474487, -0.01566094160079956, 0.055218011140823364, 0.1260969638824463, 0.1969759464263916, 0.2678549289703369, 0.33873388171195984, 0.40961283445358276, 0.4804918169975281, 0.5513707995414734, 0.6222497224807739, 0.6931287050247192, 0.7640076875686646, 0.8348866701126099, 0.9057656526565552, 0.9766445755958557, 1.0475234985351562, 1.1184024810791016, 1.1892814636230469, 1.2601604461669922, 1.3310394287109375, 1.4019184112548828, 1.4727973937988281, 1.5436763763427734, 1.6145553588867188, 1.685434341430664, 1.7563132047653198, 1.8271921873092651, 1.8980711698532104, 1.9689501523971558, 2.0398290157318115, 2.110707998275757, 2.181586980819702, 2.2524659633636475, 2.3233449459075928, 2.394223928451538, 2.4651029109954834]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 6.0, 8.0, 8.0, 18.0, 13.0, 18.0, 33.0, 40.0, 48.0, 78.0, 145.0, 209.0, 345.0, 566.0, 1037.0, 1887.0, 3606.0, 7264.0, 17612.0, 174145.0, 797181.0, 25415.0, 9197.0, 4308.0, 2327.0, 1268.0, 688.0, 370.0, 238.0, 159.0, 95.0, 57.0, 49.0, 38.0, 24.0, 21.0, 15.0, 8.0, 1.0, 2.0, 3.0, 8.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.421875, -2.346527099609375, -2.27117919921875, -2.195831298828125, -2.1204833984375, -2.045135498046875, -1.96978759765625, -1.894439697265625, -1.819091796875, -1.743743896484375, -1.66839599609375, -1.593048095703125, -1.5177001953125, -1.442352294921875, -1.36700439453125, -1.291656494140625, -1.21630859375, -1.140960693359375, -1.06561279296875, -0.990264892578125, -0.9149169921875, -0.839569091796875, -0.76422119140625, -0.688873291015625, -0.613525390625, -0.538177490234375, -0.46282958984375, -0.387481689453125, -0.3121337890625, -0.236785888671875, -0.16143798828125, -0.086090087890625, -0.0107421875, 0.064605712890625, 0.13995361328125, 0.215301513671875, 0.2906494140625, 0.365997314453125, 0.44134521484375, 0.516693115234375, 0.592041015625, 0.667388916015625, 0.74273681640625, 0.818084716796875, 0.8934326171875, 0.968780517578125, 1.04412841796875, 1.119476318359375, 1.19482421875, 1.270172119140625, 1.34552001953125, 1.420867919921875, 1.4962158203125, 1.571563720703125, 1.64691162109375, 1.722259521484375, 1.797607421875, 1.872955322265625, 1.94830322265625, 2.023651123046875, 2.0989990234375, 2.174346923828125, 2.24969482421875, 2.325042724609375, 2.400390625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 6.0, 8.0, 5.0, 7.0, 16.0, 24.0, 76.0, 265.0, 359.0, 121.0, 22.0, 14.0, 17.0, 7.0, 4.0, 10.0, 4.0, 4.0, 4.0, 4.0, 5.0, 1.0, 3.0, 1.0, 5.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.290283203125, -0.27837371826171875, -0.2664642333984375, -0.25455474853515625, -0.242645263671875, -0.23073577880859375, -0.2188262939453125, -0.20691680908203125, -0.19500732421875, -0.18309783935546875, -0.1711883544921875, -0.15927886962890625, -0.147369384765625, -0.13545989990234375, -0.1235504150390625, -0.11164093017578125, -0.0997314453125, -0.08782196044921875, -0.0759124755859375, -0.06400299072265625, -0.052093505859375, -0.04018402099609375, -0.0282745361328125, -0.01636505126953125, -0.00445556640625, 0.00745391845703125, 0.0193634033203125, 0.03127288818359375, 0.043182373046875, 0.05509185791015625, 0.0670013427734375, 0.07891082763671875, 0.0908203125, 0.10272979736328125, 0.1146392822265625, 0.12654876708984375, 0.138458251953125, 0.15036773681640625, 0.1622772216796875, 0.17418670654296875, 0.18609619140625, 0.19800567626953125, 0.2099151611328125, 0.22182464599609375, 0.233734130859375, 0.24564361572265625, 0.2575531005859375, 0.26946258544921875, 0.2813720703125, 0.29328155517578125, 0.3051910400390625, 0.31710052490234375, 0.329010009765625, 0.34091949462890625, 0.3528289794921875, 0.36473846435546875, 0.37664794921875, 0.38855743408203125, 0.4004669189453125, 0.41237640380859375, 0.424285888671875, 0.43619537353515625, 0.4481048583984375, 0.46001434326171875, 0.471923828125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 7.0, 15.0, 27.0, 36.0, 72.0, 129.0, 247.0, 528.0, 1101.0, 2429.0, 6540.0, 20376.0, 78535.0, 576067.0, 288978.0, 51090.0, 14042.0, 4745.0, 1906.0, 799.0, 400.0, 203.0, 137.0, 69.0, 37.0, 20.0, 8.0, 6.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8759765625, -1.8004913330078125, -1.725006103515625, -1.6495208740234375, -1.57403564453125, -1.4985504150390625, -1.423065185546875, -1.3475799560546875, -1.2720947265625, -1.1966094970703125, -1.121124267578125, -1.0456390380859375, -0.97015380859375, -0.8946685791015625, -0.819183349609375, -0.7436981201171875, -0.668212890625, -0.5927276611328125, -0.517242431640625, -0.4417572021484375, -0.36627197265625, -0.2907867431640625, -0.215301513671875, -0.1398162841796875, -0.0643310546875, 0.0111541748046875, 0.086639404296875, 0.1621246337890625, 0.23760986328125, 0.3130950927734375, 0.388580322265625, 0.4640655517578125, 0.53955078125, 0.6150360107421875, 0.690521240234375, 0.7660064697265625, 0.84149169921875, 0.9169769287109375, 0.992462158203125, 1.0679473876953125, 1.1434326171875, 1.2189178466796875, 1.294403076171875, 1.3698883056640625, 1.44537353515625, 1.5208587646484375, 1.596343994140625, 1.6718292236328125, 1.747314453125, 1.8227996826171875, 1.898284912109375, 1.9737701416015625, 2.04925537109375, 2.1247406005859375, 2.200225830078125, 2.2757110595703125, 2.3511962890625, 2.4266815185546875, 2.502166748046875, 2.5776519775390625, 2.65313720703125, 2.7286224365234375, 2.804107666015625, 2.8795928955078125, 2.955078125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 9.0, 4.0, 9.0, 6.0, 6.0, 10.0, 12.0, 10.0, 28.0, 34.0, 20.0, 20.0, 30.0, 35.0, 34.0, 37.0, 36.0, 40.0, 38.0, 34.0, 43.0, 42.0, 48.0, 39.0, 45.0, 49.0, 49.0, 43.0, 24.0, 24.0, 17.0, 23.0, 24.0, 11.0, 10.0, 14.0, 10.0, 10.0, 5.0, 4.0, 2.0, 7.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.26953125, -1.2282562255859375, -1.186981201171875, -1.1457061767578125, -1.10443115234375, -1.0631561279296875, -1.021881103515625, -0.9806060791015625, -0.9393310546875, -0.8980560302734375, -0.856781005859375, -0.8155059814453125, -0.77423095703125, -0.7329559326171875, -0.691680908203125, -0.6504058837890625, -0.609130859375, -0.5678558349609375, -0.526580810546875, -0.4853057861328125, -0.44403076171875, -0.4027557373046875, -0.361480712890625, -0.3202056884765625, -0.2789306640625, -0.2376556396484375, -0.196380615234375, -0.1551055908203125, -0.11383056640625, -0.0725555419921875, -0.031280517578125, 0.0099945068359375, 0.05126953125, 0.0925445556640625, 0.133819580078125, 0.1750946044921875, 0.21636962890625, 0.2576446533203125, 0.298919677734375, 0.3401947021484375, 0.3814697265625, 0.4227447509765625, 0.464019775390625, 0.5052947998046875, 0.54656982421875, 0.5878448486328125, 0.629119873046875, 0.6703948974609375, 0.711669921875, 0.7529449462890625, 0.794219970703125, 0.8354949951171875, 0.87677001953125, 0.9180450439453125, 0.959320068359375, 1.0005950927734375, 1.0418701171875, 1.0831451416015625, 1.124420166015625, 1.1656951904296875, 1.20697021484375, 1.2482452392578125, 1.289520263671875, 1.3307952880859375, 1.3720703125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 10.0, 13.0, 22.0, 25.0, 47.0, 79.0, 146.0, 308.0, 672.0, 1684.0, 5523.0, 33990.0, 842506.0, 146879.0, 11902.0, 2851.0, 1005.0, 418.0, 207.0, 103.0, 57.0, 36.0, 19.0, 15.0, 7.0, 6.0, 13.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1328125, -2.049957275390625, -1.96710205078125, -1.884246826171875, -1.8013916015625, -1.718536376953125, -1.63568115234375, -1.552825927734375, -1.469970703125, -1.387115478515625, -1.30426025390625, -1.221405029296875, -1.1385498046875, -1.055694580078125, -0.97283935546875, -0.889984130859375, -0.80712890625, -0.724273681640625, -0.64141845703125, -0.558563232421875, -0.4757080078125, -0.392852783203125, -0.30999755859375, -0.227142333984375, -0.144287109375, -0.061431884765625, 0.02142333984375, 0.104278564453125, 0.1871337890625, 0.269989013671875, 0.35284423828125, 0.435699462890625, 0.5185546875, 0.601409912109375, 0.68426513671875, 0.767120361328125, 0.8499755859375, 0.932830810546875, 1.01568603515625, 1.098541259765625, 1.181396484375, 1.264251708984375, 1.34710693359375, 1.429962158203125, 1.5128173828125, 1.595672607421875, 1.67852783203125, 1.761383056640625, 1.84423828125, 1.927093505859375, 2.00994873046875, 2.092803955078125, 2.1756591796875, 2.258514404296875, 2.34136962890625, 2.424224853515625, 2.507080078125, 2.589935302734375, 2.67279052734375, 2.755645751953125, 2.8385009765625, 2.921356201171875, 3.00421142578125, 3.087066650390625, 3.169921875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 7.0, 14.0, 9.0, 13.0, 23.0, 27.0, 38.0, 40.0, 80.0, 115.0, 133.0, 115.0, 114.0, 72.0, 65.0, 28.0, 32.0, 17.0, 15.0, 15.0, 14.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.547306060791016e-05, -8.206255733966827e-05, -7.865205407142639e-05, -7.524155080318451e-05, -7.183104753494263e-05, -6.842054426670074e-05, -6.501004099845886e-05, -6.159953773021698e-05, -5.81890344619751e-05, -5.4778531193733215e-05, -5.136802792549133e-05, -4.795752465724945e-05, -4.454702138900757e-05, -4.1136518120765686e-05, -3.7726014852523804e-05, -3.431551158428192e-05, -3.090500831604004e-05, -2.7494505047798157e-05, -2.4084001779556274e-05, -2.0673498511314392e-05, -1.726299524307251e-05, -1.3852491974830627e-05, -1.0441988706588745e-05, -7.031485438346863e-06, -3.6209821701049805e-06, -2.1047890186309814e-07, 3.200024366378784e-06, 6.6105276346206665e-06, 1.0021030902862549e-05, 1.3431534171104431e-05, 1.6842037439346313e-05, 2.0252540707588196e-05, 2.3663043975830078e-05, 2.707354724407196e-05, 3.0484050512313843e-05, 3.3894553780555725e-05, 3.730505704879761e-05, 4.071556031703949e-05, 4.412606358528137e-05, 4.7536566853523254e-05, 5.094707012176514e-05, 5.435757339000702e-05, 5.77680766582489e-05, 6.117857992649078e-05, 6.458908319473267e-05, 6.799958646297455e-05, 7.141008973121643e-05, 7.482059299945831e-05, 7.82310962677002e-05, 8.164159953594208e-05, 8.505210280418396e-05, 8.846260607242584e-05, 9.187310934066772e-05, 9.528361260890961e-05, 9.869411587715149e-05, 0.00010210461914539337, 0.00010551512241363525, 0.00010892562568187714, 0.00011233612895011902, 0.0001157466322183609, 0.00011915713548660278, 0.00012256763875484467, 0.00012597814202308655, 0.00012938864529132843, 0.0001327991485595703]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 6.0, 4.0, 9.0, 10.0, 16.0, 16.0, 23.0, 25.0, 44.0, 41.0, 67.0, 100.0, 125.0, 180.0, 282.0, 427.0, 635.0, 1006.0, 1834.0, 3315.0, 6653.0, 15258.0, 43878.0, 198516.0, 606747.0, 115521.0, 30304.0, 11343.0, 5242.0, 2687.0, 1523.0, 901.0, 577.0, 349.0, 261.0, 188.0, 130.0, 85.0, 56.0, 42.0, 31.0, 24.0, 15.0, 19.0, 6.0, 12.0, 4.0, 7.0, 3.0, 5.0, 1.0, 4.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.095703125, -1.06182861328125, -1.0279541015625, -0.99407958984375, -0.960205078125, -0.92633056640625, -0.8924560546875, -0.85858154296875, -0.82470703125, -0.79083251953125, -0.7569580078125, -0.72308349609375, -0.689208984375, -0.65533447265625, -0.6214599609375, -0.58758544921875, -0.5537109375, -0.51983642578125, -0.4859619140625, -0.45208740234375, -0.418212890625, -0.38433837890625, -0.3504638671875, -0.31658935546875, -0.28271484375, -0.24884033203125, -0.2149658203125, -0.18109130859375, -0.147216796875, -0.11334228515625, -0.0794677734375, -0.04559326171875, -0.01171875, 0.02215576171875, 0.0560302734375, 0.08990478515625, 0.123779296875, 0.15765380859375, 0.1915283203125, 0.22540283203125, 0.25927734375, 0.29315185546875, 0.3270263671875, 0.36090087890625, 0.394775390625, 0.42864990234375, 0.4625244140625, 0.49639892578125, 0.5302734375, 0.56414794921875, 0.5980224609375, 0.63189697265625, 0.665771484375, 0.69964599609375, 0.7335205078125, 0.76739501953125, 0.80126953125, 0.83514404296875, 0.8690185546875, 0.90289306640625, 0.936767578125, 0.97064208984375, 1.0045166015625, 1.03839111328125, 1.072265625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 9.0, 11.0, 15.0, 10.0, 33.0, 33.0, 42.0, 52.0, 52.0, 76.0, 85.0, 100.0, 93.0, 91.0, 70.0, 63.0, 38.0, 27.0, 29.0, 14.0, 13.0, 11.0, 3.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0126953125, -0.9787750244140625, -0.944854736328125, -0.9109344482421875, -0.87701416015625, -0.8430938720703125, -0.809173583984375, -0.7752532958984375, -0.7413330078125, -0.7074127197265625, -0.673492431640625, -0.6395721435546875, -0.60565185546875, -0.5717315673828125, -0.537811279296875, -0.5038909912109375, -0.469970703125, -0.4360504150390625, -0.402130126953125, -0.3682098388671875, -0.33428955078125, -0.3003692626953125, -0.266448974609375, -0.2325286865234375, -0.1986083984375, -0.1646881103515625, -0.130767822265625, -0.0968475341796875, -0.06292724609375, -0.0290069580078125, 0.004913330078125, 0.0388336181640625, 0.07275390625, 0.1066741943359375, 0.140594482421875, 0.1745147705078125, 0.20843505859375, 0.2423553466796875, 0.276275634765625, 0.3101959228515625, 0.3441162109375, 0.3780364990234375, 0.411956787109375, 0.4458770751953125, 0.47979736328125, 0.5137176513671875, 0.547637939453125, 0.5815582275390625, 0.615478515625, 0.6493988037109375, 0.683319091796875, 0.7172393798828125, 0.75115966796875, 0.7850799560546875, 0.819000244140625, 0.8529205322265625, 0.8868408203125, 0.9207611083984375, 0.954681396484375, 0.9886016845703125, 1.02252197265625, 1.0564422607421875, 1.090362548828125, 1.1242828369140625, 1.158203125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 11.0, 13.0, 35.0, 90.0, 375.0, 296.0, 94.0, 44.0, 22.0, 7.0, 7.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.14950942993164, -29.260095596313477, -28.370681762695312, -27.48126792907715, -26.591854095458984, -25.70244026184082, -24.813026428222656, -23.923612594604492, -23.034198760986328, -22.144784927368164, -21.25537109375, -20.365957260131836, -19.476543426513672, -18.587129592895508, -17.697715759277344, -16.80830192565918, -15.918888092041016, -15.029474258422852, -14.140060424804688, -13.250646591186523, -12.36123275756836, -11.471818923950195, -10.582405090332031, -9.692991256713867, -8.803577423095703, -7.914163589477539, -7.024749755859375, -6.135335922241211, -5.245922088623047, -4.356508255004883, -3.4670944213867188, -2.5776805877685547, -1.6882667541503906, -0.7988529205322266, 0.0905609130859375, 0.9799747467041016, 1.8693885803222656, 2.7588024139404297, 3.6482162475585938, 4.537630081176758, 5.427043914794922, 6.316457748413086, 7.20587158203125, 8.095285415649414, 8.984699249267578, 9.874113082885742, 10.763526916503906, 11.65294075012207, 12.542354583740234, 13.431768417358398, 14.321182250976562, 15.210596084594727, 16.10000991821289, 16.989423751831055, 17.87883758544922, 18.768251419067383, 19.657665252685547, 20.54707908630371, 21.436492919921875, 22.32590675354004, 23.215320587158203, 24.104734420776367, 24.99414825439453, 25.883562088012695, 26.77297592163086]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 0.0, 6.0, 3.0, 8.0, 10.0, 14.0, 14.0, 48.0, 101.0, 144.0, 220.0, 180.0, 114.0, 49.0, 22.0, 20.0, 13.0, 7.0, 7.0, 5.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.57391357421875, -39.54993438720703, -38.52595520019531, -37.501976013183594, -36.477996826171875, -35.454017639160156, -34.43003845214844, -33.40605926513672, -32.382080078125, -31.35810089111328, -30.334121704101562, -29.310142517089844, -28.286163330078125, -27.262184143066406, -26.238203048706055, -25.214223861694336, -24.190242767333984, -23.166263580322266, -22.142284393310547, -21.118305206298828, -20.09432601928711, -19.07034683227539, -18.04636573791504, -17.02238655090332, -15.998407363891602, -14.974428176879883, -13.950448989868164, -12.926468849182129, -11.90248966217041, -10.878510475158691, -9.854530334472656, -8.830551147460938, -7.806571960449219, -6.7825927734375, -5.758613109588623, -4.734633445739746, -3.7106542587280273, -2.6866750717163086, -1.6626954078674316, -0.6387157440185547, 0.38526344299316406, 1.409242868423462, 2.4332222938537598, 3.4572017192840576, 4.4811811447143555, 5.505160331726074, 6.529139995574951, 7.553119659423828, 8.577098846435547, 9.601078033447266, 10.625057220458984, 11.64903736114502, 12.673016548156738, 13.696995735168457, 14.720975875854492, 15.744955062866211, 16.76893424987793, 17.79291343688965, 18.816892623901367, 19.840871810913086, 20.864852905273438, 21.888832092285156, 22.912811279296875, 23.936790466308594, 24.960769653320312]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 2.0, 4.0, 5.0, 3.0, 8.0, 9.0, 16.0, 28.0, 31.0, 42.0, 69.0, 88.0, 142.0, 217.0, 362.0, 623.0, 1185.0, 2591.0, 6223.0, 23786.0, 3942752.0, 192559.0, 15082.0, 4688.0, 1889.0, 888.0, 437.0, 213.0, 122.0, 72.0, 53.0, 34.0, 14.0, 14.0, 9.0, 8.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5703125, -7.36480712890625, -7.1593017578125, -6.95379638671875, -6.748291015625, -6.54278564453125, -6.3372802734375, -6.13177490234375, -5.92626953125, -5.72076416015625, -5.5152587890625, -5.30975341796875, -5.104248046875, -4.89874267578125, -4.6932373046875, -4.48773193359375, -4.2822265625, -4.07672119140625, -3.8712158203125, -3.66571044921875, -3.460205078125, -3.25469970703125, -3.0491943359375, -2.84368896484375, -2.63818359375, -2.43267822265625, -2.2271728515625, -2.02166748046875, -1.816162109375, -1.61065673828125, -1.4051513671875, -1.19964599609375, -0.994140625, -0.78863525390625, -0.5831298828125, -0.37762451171875, -0.172119140625, 0.03338623046875, 0.2388916015625, 0.44439697265625, 0.64990234375, 0.85540771484375, 1.0609130859375, 1.26641845703125, 1.471923828125, 1.67742919921875, 1.8829345703125, 2.08843994140625, 2.2939453125, 2.49945068359375, 2.7049560546875, 2.91046142578125, 3.115966796875, 3.32147216796875, 3.5269775390625, 3.73248291015625, 3.93798828125, 4.14349365234375, 4.3489990234375, 4.55450439453125, 4.760009765625, 4.96551513671875, 5.1710205078125, 5.37652587890625, 5.58203125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 3.0, 3.0, 7.0, 6.0, 4.0, 5.0, 11.0, 11.0, 22.0, 47.0, 122.0, 228.0, 255.0, 119.0, 56.0, 28.0, 14.0, 12.0, 11.0, 11.0, 2.0, 5.0, 3.0, 5.0, 2.0, 5.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49951171875, -0.486724853515625, -0.47393798828125, -0.461151123046875, -0.4483642578125, -0.435577392578125, -0.42279052734375, -0.410003662109375, -0.397216796875, -0.384429931640625, -0.37164306640625, -0.358856201171875, -0.3460693359375, -0.333282470703125, -0.32049560546875, -0.307708740234375, -0.294921875, -0.282135009765625, -0.26934814453125, -0.256561279296875, -0.2437744140625, -0.230987548828125, -0.21820068359375, -0.205413818359375, -0.192626953125, -0.179840087890625, -0.16705322265625, -0.154266357421875, -0.1414794921875, -0.128692626953125, -0.11590576171875, -0.103118896484375, -0.09033203125, -0.077545166015625, -0.06475830078125, -0.051971435546875, -0.0391845703125, -0.026397705078125, -0.01361083984375, -0.000823974609375, 0.011962890625, 0.024749755859375, 0.03753662109375, 0.050323486328125, 0.0631103515625, 0.075897216796875, 0.08868408203125, 0.101470947265625, 0.1142578125, 0.127044677734375, 0.13983154296875, 0.152618408203125, 0.1654052734375, 0.178192138671875, 0.19097900390625, 0.203765869140625, 0.216552734375, 0.229339599609375, 0.24212646484375, 0.254913330078125, 0.2677001953125, 0.280487060546875, 0.29327392578125, 0.306060791015625, 0.31884765625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 7.0, 6.0, 9.0, 12.0, 21.0, 17.0, 28.0, 43.0, 60.0, 77.0, 109.0, 160.0, 249.0, 363.0, 563.0, 832.0, 1252.0, 2344.0, 4114.0, 7896.0, 16942.0, 46338.0, 243040.0, 3636861.0, 164231.0, 37847.0, 14515.0, 7007.0, 3693.0, 2056.0, 1234.0, 763.0, 519.0, 304.0, 240.0, 154.0, 115.0, 69.0, 61.0, 25.0, 34.0, 20.0, 13.0, 17.0, 11.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.201171875, -3.1024169921875, -3.003662109375, -2.9049072265625, -2.80615234375, -2.7073974609375, -2.608642578125, -2.5098876953125, -2.4111328125, -2.3123779296875, -2.213623046875, -2.1148681640625, -2.01611328125, -1.9173583984375, -1.818603515625, -1.7198486328125, -1.62109375, -1.5223388671875, -1.423583984375, -1.3248291015625, -1.22607421875, -1.1273193359375, -1.028564453125, -0.9298095703125, -0.8310546875, -0.7322998046875, -0.633544921875, -0.5347900390625, -0.43603515625, -0.3372802734375, -0.238525390625, -0.1397705078125, -0.041015625, 0.0577392578125, 0.156494140625, 0.2552490234375, 0.35400390625, 0.4527587890625, 0.551513671875, 0.6502685546875, 0.7490234375, 0.8477783203125, 0.946533203125, 1.0452880859375, 1.14404296875, 1.2427978515625, 1.341552734375, 1.4403076171875, 1.5390625, 1.6378173828125, 1.736572265625, 1.8353271484375, 1.93408203125, 2.0328369140625, 2.131591796875, 2.2303466796875, 2.3291015625, 2.4278564453125, 2.526611328125, 2.6253662109375, 2.72412109375, 2.8228759765625, 2.921630859375, 3.0203857421875, 3.119140625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 1.0, 2.0, 4.0, 6.0, 5.0, 7.0, 6.0, 9.0, 15.0, 19.0, 19.0, 40.0, 59.0, 116.0, 195.0, 733.0, 2310.0, 227.0, 112.0, 55.0, 35.0, 25.0, 17.0, 11.0, 5.0, 9.0, 8.0, 5.0, 5.0, 8.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.64599609375, -0.6259002685546875, -0.605804443359375, -0.5857086181640625, -0.56561279296875, -0.5455169677734375, -0.525421142578125, -0.5053253173828125, -0.4852294921875, -0.4651336669921875, -0.445037841796875, -0.4249420166015625, -0.40484619140625, -0.3847503662109375, -0.364654541015625, -0.3445587158203125, -0.324462890625, -0.3043670654296875, -0.284271240234375, -0.2641754150390625, -0.24407958984375, -0.2239837646484375, -0.203887939453125, -0.1837921142578125, -0.1636962890625, -0.1436004638671875, -0.123504638671875, -0.1034088134765625, -0.08331298828125, -0.0632171630859375, -0.043121337890625, -0.0230255126953125, -0.0029296875, 0.0171661376953125, 0.037261962890625, 0.0573577880859375, 0.07745361328125, 0.0975494384765625, 0.117645263671875, 0.1377410888671875, 0.1578369140625, 0.1779327392578125, 0.198028564453125, 0.2181243896484375, 0.23822021484375, 0.2583160400390625, 0.278411865234375, 0.2985076904296875, 0.318603515625, 0.3386993408203125, 0.358795166015625, 0.3788909912109375, 0.39898681640625, 0.4190826416015625, 0.439178466796875, 0.4592742919921875, 0.4793701171875, 0.4994659423828125, 0.519561767578125, 0.5396575927734375, 0.55975341796875, 0.5798492431640625, 0.599945068359375, 0.6200408935546875, 0.64013671875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 0.0, 6.0, 5.0, 3.0, 5.0, 16.0, 28.0, 43.0, 113.0, 216.0, 261.0, 162.0, 53.0, 40.0, 14.0, 15.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.686704158782959, -4.575982570648193, -4.465260982513428, -4.354539394378662, -4.2438178062438965, -4.133096218109131, -4.022374153137207, -3.9116528034210205, -3.800931215286255, -3.6902096271514893, -3.5794880390167236, -3.468766212463379, -3.3580446243286133, -3.2473230361938477, -3.136601448059082, -3.0258798599243164, -2.915158271789551, -2.804436683654785, -2.6937150955200195, -2.582993507385254, -2.472271680831909, -2.3615500926971436, -2.250828504562378, -2.1401069164276123, -2.0293850898742676, -1.918663501739502, -1.8079417943954468, -1.6972202062606812, -1.5864986181259155, -1.4757769107818604, -1.3650553226470947, -1.254333734512329, -1.1436121463775635, -1.0328905582427979, -0.9221689105033875, -0.811447262763977, -0.7007256746292114, -0.590004026889801, -0.4792823791503906, -0.368560791015625, -0.2578391432762146, -0.1471175253391266, -0.03639589250087738, 0.07432574033737183, 0.18504735827445984, 0.29576897621154785, 0.40649062395095825, 0.5172122120857239, 0.6279338598251343, 0.7386555075645447, 0.8493770956993103, 0.9600987434387207, 1.0708203315734863, 1.181541919708252, 1.2922636270523071, 1.4029852151870728, 1.513706922531128, 1.6244285106658936, 1.7351502180099487, 1.8458718061447144, 1.95659339427948, 2.067315101623535, 2.178036689758301, 2.2887582778930664, 2.399479866027832]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 0.0, 10.0, 11.0, 10.0, 11.0, 24.0, 31.0, 67.0, 103.0, 127.0, 190.0, 153.0, 123.0, 53.0, 32.0, 18.0, 12.0, 6.0, 7.0, 4.0, 4.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.885369300842285, -2.7565367221832275, -2.62770414352417, -2.4988715648651123, -2.3700389862060547, -2.241206407546997, -2.1123738288879395, -1.9835412502288818, -1.8547086715698242, -1.7258760929107666, -1.597043514251709, -1.4682109355926514, -1.3393783569335938, -1.2105457782745361, -1.0817131996154785, -0.9528806209564209, -0.8240480422973633, -0.6952154636383057, -0.566382884979248, -0.43755030632019043, -0.3087177276611328, -0.1798851490020752, -0.05105257034301758, 0.07778000831604004, 0.20661258697509766, 0.3354451656341553, 0.4642777442932129, 0.5931103229522705, 0.7219429016113281, 0.8507754802703857, 0.9796080589294434, 1.108440637588501, 1.2372732162475586, 1.3661057949066162, 1.4949383735656738, 1.6237709522247314, 1.752603530883789, 1.8814361095428467, 2.0102686882019043, 2.139101266860962, 2.2679338455200195, 2.396766424179077, 2.5255990028381348, 2.6544315814971924, 2.78326416015625, 2.9120967388153076, 3.0409293174743652, 3.169761896133423, 3.2985944747924805, 3.427427053451538, 3.5562596321105957, 3.6850922107696533, 3.813924789428711, 3.9427573680877686, 4.071589946746826, 4.200422286987305, 4.329255104064941, 4.458087921142578, 4.586920261383057, 4.715752601623535, 4.844585418701172, 4.973418235778809, 5.102250576019287, 5.231082916259766, 5.359915733337402]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 9.0, 6.0, 15.0, 16.0, 23.0, 32.0, 30.0, 67.0, 97.0, 127.0, 206.0, 255.0, 358.0, 470.0, 679.0, 969.0, 1413.0, 1978.0, 2911.0, 4525.0, 7325.0, 13835.0, 33132.0, 115492.0, 597727.0, 181744.0, 43696.0, 16869.0, 8846.0, 5109.0, 3193.0, 2210.0, 1538.0, 1066.0, 715.0, 515.0, 378.0, 300.0, 194.0, 151.0, 105.0, 62.0, 51.0, 33.0, 32.0, 21.0, 13.0, 11.0, 5.0, 1.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.423828125, -1.377349853515625, -1.33087158203125, -1.284393310546875, -1.2379150390625, -1.191436767578125, -1.14495849609375, -1.098480224609375, -1.052001953125, -1.005523681640625, -0.95904541015625, -0.912567138671875, -0.8660888671875, -0.819610595703125, -0.77313232421875, -0.726654052734375, -0.68017578125, -0.633697509765625, -0.58721923828125, -0.540740966796875, -0.4942626953125, -0.447784423828125, -0.40130615234375, -0.354827880859375, -0.308349609375, -0.261871337890625, -0.21539306640625, -0.168914794921875, -0.1224365234375, -0.075958251953125, -0.02947998046875, 0.016998291015625, 0.0634765625, 0.109954833984375, 0.15643310546875, 0.202911376953125, 0.2493896484375, 0.295867919921875, 0.34234619140625, 0.388824462890625, 0.435302734375, 0.481781005859375, 0.52825927734375, 0.574737548828125, 0.6212158203125, 0.667694091796875, 0.71417236328125, 0.760650634765625, 0.80712890625, 0.853607177734375, 0.90008544921875, 0.946563720703125, 0.9930419921875, 1.039520263671875, 1.08599853515625, 1.132476806640625, 1.178955078125, 1.225433349609375, 1.27191162109375, 1.318389892578125, 1.3648681640625, 1.411346435546875, 1.45782470703125, 1.504302978515625, 1.55078125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 4.0, 1.0, 2.0, 2.0, 1.0, 5.0, 4.0, 3.0, 5.0, 4.0, 6.0, 9.0, 6.0, 17.0, 28.0, 23.0, 60.0, 84.0, 110.0, 131.0, 138.0, 89.0, 80.0, 52.0, 38.0, 22.0, 20.0, 13.0, 6.0, 6.0, 3.0, 4.0, 7.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.186279296875, -0.17987632751464844, -0.17347335815429688, -0.1670703887939453, -0.16066741943359375, -0.1542644500732422, -0.14786148071289062, -0.14145851135253906, -0.1350555419921875, -0.12865257263183594, -0.12224960327148438, -0.11584663391113281, -0.10944366455078125, -0.10304069519042969, -0.09663772583007812, -0.09023475646972656, -0.083831787109375, -0.07742881774902344, -0.07102584838867188, -0.06462287902832031, -0.05821990966796875, -0.05181694030761719, -0.045413970947265625, -0.03901100158691406, -0.0326080322265625, -0.026205062866210938, -0.019802093505859375, -0.013399124145507812, -0.00699615478515625, -0.0005931854248046875, 0.005809783935546875, 0.012212753295898438, 0.01861572265625, 0.025018692016601562, 0.031421661376953125, 0.03782463073730469, 0.04422760009765625, 0.05063056945800781, 0.057033538818359375, 0.06343650817871094, 0.0698394775390625, 0.07624244689941406, 0.08264541625976562, 0.08904838562011719, 0.09545135498046875, 0.10185432434082031, 0.10825729370117188, 0.11466026306152344, 0.121063232421875, 0.12746620178222656, 0.13386917114257812, 0.1402721405029297, 0.14667510986328125, 0.1530780792236328, 0.15948104858398438, 0.16588401794433594, 0.1722869873046875, 0.17868995666503906, 0.18509292602539062, 0.1914958953857422, 0.19789886474609375, 0.2043018341064453, 0.21070480346679688, 0.21710777282714844, 0.2235107421875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 13.0, 13.0, 22.0, 45.0, 71.0, 163.0, 284.0, 531.0, 943.0, 1811.0, 3679.0, 7471.0, 16285.0, 36715.0, 93020.0, 311838.0, 386786.0, 109638.0, 42741.0, 18728.0, 8846.0, 4311.0, 2158.0, 1096.0, 623.0, 302.0, 188.0, 92.0, 65.0, 28.0, 16.0, 9.0, 9.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3212890625, -1.27423095703125, -1.2271728515625, -1.18011474609375, -1.133056640625, -1.08599853515625, -1.0389404296875, -0.99188232421875, -0.94482421875, -0.89776611328125, -0.8507080078125, -0.80364990234375, -0.756591796875, -0.70953369140625, -0.6624755859375, -0.61541748046875, -0.568359375, -0.52130126953125, -0.4742431640625, -0.42718505859375, -0.380126953125, -0.33306884765625, -0.2860107421875, -0.23895263671875, -0.19189453125, -0.14483642578125, -0.0977783203125, -0.05072021484375, -0.003662109375, 0.04339599609375, 0.0904541015625, 0.13751220703125, 0.1845703125, 0.23162841796875, 0.2786865234375, 0.32574462890625, 0.372802734375, 0.41986083984375, 0.4669189453125, 0.51397705078125, 0.56103515625, 0.60809326171875, 0.6551513671875, 0.70220947265625, 0.749267578125, 0.79632568359375, 0.8433837890625, 0.89044189453125, 0.9375, 0.98455810546875, 1.0316162109375, 1.07867431640625, 1.125732421875, 1.17279052734375, 1.2198486328125, 1.26690673828125, 1.31396484375, 1.36102294921875, 1.4080810546875, 1.45513916015625, 1.502197265625, 1.54925537109375, 1.5963134765625, 1.64337158203125, 1.6904296875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 5.0, 3.0, 2.0, 3.0, 4.0, 7.0, 5.0, 8.0, 12.0, 7.0, 11.0, 13.0, 19.0, 31.0, 17.0, 24.0, 24.0, 21.0, 28.0, 37.0, 32.0, 27.0, 38.0, 57.0, 48.0, 32.0, 27.0, 42.0, 30.0, 27.0, 37.0, 32.0, 22.0, 42.0, 26.0, 31.0, 18.0, 28.0, 21.0, 22.0, 10.0, 14.0, 6.0, 12.0, 12.0, 5.0, 11.0, 6.0, 4.0, 4.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.65966796875, -0.6369094848632812, -0.6141510009765625, -0.5913925170898438, -0.568634033203125, -0.5458755493164062, -0.5231170654296875, -0.5003585815429688, -0.47760009765625, -0.45484161376953125, -0.4320831298828125, -0.40932464599609375, -0.386566162109375, -0.36380767822265625, -0.3410491943359375, -0.31829071044921875, -0.2955322265625, -0.27277374267578125, -0.2500152587890625, -0.22725677490234375, -0.204498291015625, -0.18173980712890625, -0.1589813232421875, -0.13622283935546875, -0.11346435546875, -0.09070587158203125, -0.0679473876953125, -0.04518890380859375, -0.022430419921875, 0.00032806396484375, 0.0230865478515625, 0.04584503173828125, 0.068603515625, 0.09136199951171875, 0.1141204833984375, 0.13687896728515625, 0.159637451171875, 0.18239593505859375, 0.2051544189453125, 0.22791290283203125, 0.25067138671875, 0.27342987060546875, 0.2961883544921875, 0.31894683837890625, 0.341705322265625, 0.36446380615234375, 0.3872222900390625, 0.40998077392578125, 0.4327392578125, 0.45549774169921875, 0.4782562255859375, 0.5010147094726562, 0.523773193359375, 0.5465316772460938, 0.5692901611328125, 0.5920486450195312, 0.61480712890625, 0.6375656127929688, 0.6603240966796875, 0.6830825805664062, 0.705841064453125, 0.7285995483398438, 0.7513580322265625, 0.7741165161132812, 0.796875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 7.0, 4.0, 3.0, 13.0, 19.0, 37.0, 91.0, 316.0, 1233.0, 7414.0, 215047.0, 811131.0, 10876.0, 1699.0, 427.0, 121.0, 44.0, 18.0, 17.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.60546875, -5.43609619140625, -5.2667236328125, -5.09735107421875, -4.927978515625, -4.75860595703125, -4.5892333984375, -4.41986083984375, -4.25048828125, -4.08111572265625, -3.9117431640625, -3.74237060546875, -3.572998046875, -3.40362548828125, -3.2342529296875, -3.06488037109375, -2.8955078125, -2.72613525390625, -2.5567626953125, -2.38739013671875, -2.218017578125, -2.04864501953125, -1.8792724609375, -1.70989990234375, -1.54052734375, -1.37115478515625, -1.2017822265625, -1.03240966796875, -0.863037109375, -0.69366455078125, -0.5242919921875, -0.35491943359375, -0.185546875, -0.01617431640625, 0.1531982421875, 0.32257080078125, 0.491943359375, 0.66131591796875, 0.8306884765625, 1.00006103515625, 1.16943359375, 1.33880615234375, 1.5081787109375, 1.67755126953125, 1.846923828125, 2.01629638671875, 2.1856689453125, 2.35504150390625, 2.5244140625, 2.69378662109375, 2.8631591796875, 3.03253173828125, 3.201904296875, 3.37127685546875, 3.5406494140625, 3.71002197265625, 3.87939453125, 4.04876708984375, 4.2181396484375, 4.38751220703125, 4.556884765625, 4.72625732421875, 4.8956298828125, 5.06500244140625, 5.234375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 6.0, 12.0, 9.0, 14.0, 29.0, 34.0, 75.0, 115.0, 172.0, 154.0, 120.0, 81.0, 42.0, 43.0, 23.0, 14.0, 11.0, 11.0, 6.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011366605758666992, -0.00011011958122253418, -0.00010657310485839844, -0.0001030266284942627, -9.948015213012695e-05, -9.593367576599121e-05, -9.238719940185547e-05, -8.884072303771973e-05, -8.529424667358398e-05, -8.174777030944824e-05, -7.82012939453125e-05, -7.465481758117676e-05, -7.110834121704102e-05, -6.756186485290527e-05, -6.401538848876953e-05, -6.046891212463379e-05, -5.692243576049805e-05, -5.3375959396362305e-05, -4.982948303222656e-05, -4.628300666809082e-05, -4.273653030395508e-05, -3.9190053939819336e-05, -3.5643577575683594e-05, -3.209710121154785e-05, -2.855062484741211e-05, -2.5004148483276367e-05, -2.1457672119140625e-05, -1.7911195755004883e-05, -1.436471939086914e-05, -1.0818243026733398e-05, -7.271766662597656e-06, -3.725290298461914e-06, -1.7881393432617188e-07, 3.3676624298095703e-06, 6.9141387939453125e-06, 1.0460615158081055e-05, 1.4007091522216797e-05, 1.755356788635254e-05, 2.110004425048828e-05, 2.4646520614624023e-05, 2.8192996978759766e-05, 3.173947334289551e-05, 3.528594970703125e-05, 3.883242607116699e-05, 4.2378902435302734e-05, 4.5925378799438477e-05, 4.947185516357422e-05, 5.301833152770996e-05, 5.65648078918457e-05, 6.0111284255981445e-05, 6.365776062011719e-05, 6.720423698425293e-05, 7.075071334838867e-05, 7.429718971252441e-05, 7.784366607666016e-05, 8.13901424407959e-05, 8.493661880493164e-05, 8.848309516906738e-05, 9.202957153320312e-05, 9.557604789733887e-05, 9.912252426147461e-05, 0.00010266900062561035, 0.0001062154769897461, 0.00010976195335388184, 0.00011330842971801758]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 9.0, 6.0, 21.0, 29.0, 42.0, 62.0, 104.0, 167.0, 295.0, 588.0, 1060.0, 2258.0, 4996.0, 13703.0, 59997.0, 711425.0, 211519.0, 27234.0, 8268.0, 3343.0, 1531.0, 807.0, 441.0, 250.0, 139.0, 77.0, 53.0, 43.0, 16.0, 17.0, 13.0, 7.0, 5.0, 8.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6015625, -1.54388427734375, -1.4862060546875, -1.42852783203125, -1.370849609375, -1.31317138671875, -1.2554931640625, -1.19781494140625, -1.14013671875, -1.08245849609375, -1.0247802734375, -0.96710205078125, -0.909423828125, -0.85174560546875, -0.7940673828125, -0.73638916015625, -0.6787109375, -0.62103271484375, -0.5633544921875, -0.50567626953125, -0.447998046875, -0.39031982421875, -0.3326416015625, -0.27496337890625, -0.21728515625, -0.15960693359375, -0.1019287109375, -0.04425048828125, 0.013427734375, 0.07110595703125, 0.1287841796875, 0.18646240234375, 0.244140625, 0.30181884765625, 0.3594970703125, 0.41717529296875, 0.474853515625, 0.53253173828125, 0.5902099609375, 0.64788818359375, 0.70556640625, 0.76324462890625, 0.8209228515625, 0.87860107421875, 0.936279296875, 0.99395751953125, 1.0516357421875, 1.10931396484375, 1.1669921875, 1.22467041015625, 1.2823486328125, 1.34002685546875, 1.397705078125, 1.45538330078125, 1.5130615234375, 1.57073974609375, 1.62841796875, 1.68609619140625, 1.7437744140625, 1.80145263671875, 1.859130859375, 1.91680908203125, 1.9744873046875, 2.03216552734375, 2.08984375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 3.0, 6.0, 6.0, 6.0, 13.0, 19.0, 25.0, 45.0, 56.0, 127.0, 220.0, 178.0, 111.0, 58.0, 41.0, 21.0, 18.0, 16.0, 11.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9775390625, -0.93511962890625, -0.8927001953125, -0.85028076171875, -0.807861328125, -0.76544189453125, -0.7230224609375, -0.68060302734375, -0.63818359375, -0.59576416015625, -0.5533447265625, -0.51092529296875, -0.468505859375, -0.42608642578125, -0.3836669921875, -0.34124755859375, -0.298828125, -0.25640869140625, -0.2139892578125, -0.17156982421875, -0.129150390625, -0.08673095703125, -0.0443115234375, -0.00189208984375, 0.04052734375, 0.08294677734375, 0.1253662109375, 0.16778564453125, 0.210205078125, 0.25262451171875, 0.2950439453125, 0.33746337890625, 0.3798828125, 0.42230224609375, 0.4647216796875, 0.50714111328125, 0.549560546875, 0.59197998046875, 0.6343994140625, 0.67681884765625, 0.71923828125, 0.76165771484375, 0.8040771484375, 0.84649658203125, 0.888916015625, 0.93133544921875, 0.9737548828125, 1.01617431640625, 1.05859375, 1.10101318359375, 1.1434326171875, 1.18585205078125, 1.228271484375, 1.27069091796875, 1.3131103515625, 1.35552978515625, 1.39794921875, 1.44036865234375, 1.4827880859375, 1.52520751953125, 1.567626953125, 1.61004638671875, 1.6524658203125, 1.69488525390625, 1.7373046875]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 6.0, 13.0, 28.0, 68.0, 150.0, 279.0, 237.0, 108.0, 56.0, 23.0, 16.0, 6.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.321365356445312, -9.800466537475586, -9.279568672180176, -8.75866985321045, -8.237771987915039, -7.7168731689453125, -7.195974349975586, -6.675076007843018, -6.154177665710449, -5.633279323577881, -5.1123809814453125, -4.591482162475586, -4.070583820343018, -3.549685478210449, -3.0287868976593018, -2.5078883171081543, -1.986989974975586, -1.466091513633728, -0.9451930522918701, -0.4242945909500122, 0.0966038703918457, 0.6175022125244141, 1.1384007930755615, 1.659299373626709, 2.1801977157592773, 2.7010960578918457, 3.221994638442993, 3.7428932189941406, 4.263791561126709, 4.784689903259277, 5.305588722229004, 5.826487064361572, 6.347385406494141, 6.868283748626709, 7.389182090759277, 7.910080909729004, 8.430978775024414, 8.95187759399414, 9.472776412963867, 9.993675231933594, 10.514573097229004, 11.03547191619873, 11.55636978149414, 12.077268600463867, 12.598167419433594, 13.119065284729004, 13.63996410369873, 14.16086196899414, 14.681760787963867, 15.202659606933594, 15.723557472229004, 16.244455337524414, 16.76535415649414, 17.286252975463867, 17.807151794433594, 18.32805061340332, 18.848949432373047, 19.369848251342773, 19.8907470703125, 20.411643981933594, 20.93254280090332, 21.453441619873047, 21.974340438842773, 22.4952392578125, 23.016136169433594]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 4.0, 0.0, 4.0, 7.0, 6.0, 5.0, 12.0, 9.0, 18.0, 22.0, 38.0, 41.0, 63.0, 75.0, 91.0, 94.0, 95.0, 82.0, 89.0, 64.0, 41.0, 40.0, 40.0, 15.0, 7.0, 10.0, 6.0, 7.0, 2.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.0383882522583, -11.698543548583984, -11.358697891235352, -11.018853187561035, -10.679008483886719, -10.339162826538086, -9.99931812286377, -9.659473419189453, -9.31962776184082, -8.979783058166504, -8.639937400817871, -8.300092697143555, -7.960247993469238, -7.620402812957764, -7.280557632446289, -6.940712928771973, -6.600868225097656, -6.261023044586182, -5.921178340911865, -5.581333160400391, -5.241488456726074, -4.9016432762146, -4.561798095703125, -4.221953392028809, -3.882108211517334, -3.5422632694244385, -3.202418327331543, -2.8625731468200684, -2.522728204727173, -2.1828832626342773, -1.8430380821228027, -1.5031931400299072, -1.1633472442626953, -0.823502242565155, -0.48365724086761475, -0.1438121795654297, 0.19603276252746582, 0.5358777046203613, 0.8757228851318359, 1.2155678272247314, 1.555412769317627, 1.8952577114105225, 2.235102653503418, 2.5749478340148926, 2.914792776107788, 3.2546377182006836, 3.594482898712158, 3.9343278408050537, 4.274172782897949, 4.614017963409424, 4.95386266708374, 5.293707847595215, 5.633552551269531, 5.973397731781006, 6.3132429122924805, 6.653087615966797, 6.9929327964782715, 7.332777976989746, 7.6726226806640625, 8.012468338012695, 8.352313041687012, 8.692157745361328, 9.032003402709961, 9.371848106384277, 9.711692810058594]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 4.0, 4.0, 5.0, 3.0, 9.0, 8.0, 8.0, 13.0, 17.0, 30.0, 39.0, 45.0, 80.0, 161.0, 224.0, 589.0, 1206.0, 2886.0, 9574.0, 73246.0, 4040994.0, 51433.0, 8724.0, 2689.0, 1150.0, 558.0, 254.0, 129.0, 80.0, 40.0, 27.0, 19.0, 8.0, 17.0, 8.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8203125, -9.55078125, -9.28125, -9.01171875, -8.7421875, -8.47265625, -8.203125, -7.93359375, -7.6640625, -7.39453125, -7.125, -6.85546875, -6.5859375, -6.31640625, -6.046875, -5.77734375, -5.5078125, -5.23828125, -4.96875, -4.69921875, -4.4296875, -4.16015625, -3.890625, -3.62109375, -3.3515625, -3.08203125, -2.8125, -2.54296875, -2.2734375, -2.00390625, -1.734375, -1.46484375, -1.1953125, -0.92578125, -0.65625, -0.38671875, -0.1171875, 0.15234375, 0.421875, 0.69140625, 0.9609375, 1.23046875, 1.5, 1.76953125, 2.0390625, 2.30859375, 2.578125, 2.84765625, 3.1171875, 3.38671875, 3.65625, 3.92578125, 4.1953125, 4.46484375, 4.734375, 5.00390625, 5.2734375, 5.54296875, 5.8125, 6.08203125, 6.3515625, 6.62109375, 6.890625, 7.16015625, 7.4296875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 4.0, 1.0, 2.0, 5.0, 6.0, 9.0, 12.0, 6.0, 24.0, 14.0, 26.0, 53.0, 70.0, 64.0, 97.0, 107.0, 91.0, 100.0, 62.0, 60.0, 45.0, 23.0, 24.0, 12.0, 21.0, 4.0, 11.0, 8.0, 4.0, 3.0, 3.0, 4.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.19775390625, -0.1917591094970703, -0.18576431274414062, -0.17976951599121094, -0.17377471923828125, -0.16777992248535156, -0.16178512573242188, -0.1557903289794922, -0.1497955322265625, -0.1438007354736328, -0.13780593872070312, -0.13181114196777344, -0.12581634521484375, -0.11982154846191406, -0.11382675170898438, -0.10783195495605469, -0.101837158203125, -0.09584236145019531, -0.08984756469726562, -0.08385276794433594, -0.07785797119140625, -0.07186317443847656, -0.06586837768554688, -0.05987358093261719, -0.0538787841796875, -0.04788398742675781, -0.041889190673828125, -0.03589439392089844, -0.02989959716796875, -0.023904800415039062, -0.017910003662109375, -0.011915206909179688, -0.00592041015625, 7.43865966796875e-05, 0.006069183349609375, 0.012063980102539062, 0.01805877685546875, 0.024053573608398438, 0.030048370361328125, 0.03604316711425781, 0.0420379638671875, 0.04803276062011719, 0.054027557373046875, 0.06002235412597656, 0.06601715087890625, 0.07201194763183594, 0.07800674438476562, 0.08400154113769531, 0.089996337890625, 0.09599113464355469, 0.10198593139648438, 0.10798072814941406, 0.11397552490234375, 0.11997032165527344, 0.12596511840820312, 0.1319599151611328, 0.1379547119140625, 0.1439495086669922, 0.14994430541992188, 0.15593910217285156, 0.16193389892578125, 0.16792869567871094, 0.17392349243164062, 0.1799182891845703, 0.1859130859375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 6.0, 2.0, 0.0, 9.0, 6.0, 9.0, 12.0, 4.0, 9.0, 11.0, 21.0, 19.0, 27.0, 24.0, 50.0, 91.0, 486.0, 6438.0, 3769507.0, 412274.0, 4625.0, 351.0, 94.0, 48.0, 30.0, 32.0, 16.0, 18.0, 15.0, 11.0, 7.0, 8.0, 2.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-21.4375, -20.8724365234375, -20.307373046875, -19.7423095703125, -19.17724609375, -18.6121826171875, -18.047119140625, -17.4820556640625, -16.9169921875, -16.3519287109375, -15.786865234375, -15.2218017578125, -14.65673828125, -14.0916748046875, -13.526611328125, -12.9615478515625, -12.396484375, -11.8314208984375, -11.266357421875, -10.7012939453125, -10.13623046875, -9.5711669921875, -9.006103515625, -8.4410400390625, -7.8759765625, -7.3109130859375, -6.745849609375, -6.1807861328125, -5.61572265625, -5.0506591796875, -4.485595703125, -3.9205322265625, -3.35546875, -2.7904052734375, -2.225341796875, -1.6602783203125, -1.09521484375, -0.5301513671875, 0.034912109375, 0.5999755859375, 1.1650390625, 1.7301025390625, 2.295166015625, 2.8602294921875, 3.42529296875, 3.9903564453125, 4.555419921875, 5.1204833984375, 5.685546875, 6.2506103515625, 6.815673828125, 7.3807373046875, 7.94580078125, 8.5108642578125, 9.075927734375, 9.6409912109375, 10.2060546875, 10.7711181640625, 11.336181640625, 11.9012451171875, 12.46630859375, 13.0313720703125, 13.596435546875, 14.1614990234375, 14.7265625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 6.0, 2.0, 3.0, 9.0, 12.0, 4.0, 15.0, 14.0, 23.0, 28.0, 34.0, 36.0, 54.0, 104.0, 194.0, 557.0, 2160.0, 343.0, 135.0, 84.0, 56.0, 40.0, 29.0, 25.0, 24.0, 9.0, 9.0, 10.0, 10.0, 8.0, 6.0, 3.0, 5.0, 7.0, 1.0, 3.0, 1.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4150390625, -0.39984130859375, -0.3846435546875, -0.36944580078125, -0.354248046875, -0.33905029296875, -0.3238525390625, -0.30865478515625, -0.29345703125, -0.27825927734375, -0.2630615234375, -0.24786376953125, -0.232666015625, -0.21746826171875, -0.2022705078125, -0.18707275390625, -0.171875, -0.15667724609375, -0.1414794921875, -0.12628173828125, -0.111083984375, -0.09588623046875, -0.0806884765625, -0.06549072265625, -0.05029296875, -0.03509521484375, -0.0198974609375, -0.00469970703125, 0.010498046875, 0.02569580078125, 0.0408935546875, 0.05609130859375, 0.0712890625, 0.08648681640625, 0.1016845703125, 0.11688232421875, 0.132080078125, 0.14727783203125, 0.1624755859375, 0.17767333984375, 0.19287109375, 0.20806884765625, 0.2232666015625, 0.23846435546875, 0.253662109375, 0.26885986328125, 0.2840576171875, 0.29925537109375, 0.314453125, 0.32965087890625, 0.3448486328125, 0.36004638671875, 0.375244140625, 0.39044189453125, 0.4056396484375, 0.42083740234375, 0.43603515625, 0.45123291015625, 0.4664306640625, 0.48162841796875, 0.496826171875, 0.51202392578125, 0.5272216796875, 0.54241943359375, 0.5576171875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 7.0, 20.0, 49.0, 116.0, 275.0, 279.0, 135.0, 66.0, 30.0, 10.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.371089458465576, -4.181789875030518, -3.992490291595459, -3.8031907081604004, -3.613891124725342, -3.424591541290283, -3.2352917194366455, -3.045992136001587, -2.8566925525665283, -2.6673929691314697, -2.478093385696411, -2.2887935638427734, -2.099493980407715, -1.9101945161819458, -1.7208948135375977, -1.531595230102539, -1.3422956466674805, -1.1529960632324219, -0.9636964201927185, -0.7743967771530151, -0.5850971937179565, -0.39579761028289795, -0.2064979076385498, -0.01719832420349121, 0.17210125923156738, 0.36140087246894836, 0.5507004857063293, 0.7400001287460327, 0.9292997121810913, 1.11859929561615, 1.307898998260498, 1.4971985816955566, 1.6864986419677734, 1.875798225402832, 2.0650978088378906, 2.254397392272949, 2.443696975708008, 2.6329965591430664, 2.822296380996704, 3.0115959644317627, 3.2008955478668213, 3.39019513130188, 3.5794947147369385, 3.768794536590576, 3.9580941200256348, 4.147393703460693, 4.336693286895752, 4.5259928703308105, 4.715292453765869, 4.904592037200928, 5.093891620635986, 5.283191204071045, 5.4724907875061035, 5.661790370941162, 5.851090431213379, 6.0403900146484375, 6.229689598083496, 6.418989181518555, 6.608288764953613, 6.797588348388672, 6.9868879318237305, 7.176187515258789, 7.365487098693848, 7.554786682128906, 7.744086265563965]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 7.0, 4.0, 3.0, 2.0, 4.0, 12.0, 13.0, 21.0, 25.0, 24.0, 46.0, 41.0, 56.0, 71.0, 81.0, 66.0, 85.0, 79.0, 65.0, 60.0, 42.0, 35.0, 38.0, 23.0, 22.0, 19.0, 13.0, 13.0, 8.0, 8.0, 4.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.019285202026367, -1.9448639154434204, -1.8704426288604736, -1.7960213422775269, -1.72160005569458, -1.6471786499023438, -1.572757363319397, -1.4983360767364502, -1.4239147901535034, -1.3494935035705566, -1.2750722169876099, -1.200650930404663, -1.1262295246124268, -1.0518083572387695, -0.9773869514465332, -0.9029656648635864, -0.8285443782806396, -0.7541230916976929, -0.6797018051147461, -0.6052804589271545, -0.5308591723442078, -0.456437885761261, -0.3820165693759918, -0.30759525299072266, -0.23317396640777588, -0.1587526649236679, -0.08433136343955994, -0.009910061955451965, 0.064511239528656, 0.13893252611160278, 0.21335384249687195, 0.2877751588821411, 0.3621964454650879, 0.43661773204803467, 0.5110390186309814, 0.585460364818573, 0.6598816514015198, 0.7343029379844666, 0.8087242841720581, 0.8831455707550049, 0.9575668573379517, 1.0319881439208984, 1.1064094305038452, 1.180830717086792, 1.2552521228790283, 1.3296732902526855, 1.4040946960449219, 1.4785159826278687, 1.5529372692108154, 1.6273585557937622, 1.701779842376709, 1.7762011289596558, 1.8506224155426025, 1.9250438213348389, 1.9994651079177856, 2.0738863945007324, 2.1483078002929688, 2.222729206085205, 2.2971503734588623, 2.3715717792510986, 2.445992946624756, 2.520414352416992, 2.5948355197906494, 2.6692569255828857, 2.743678092956543]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 10.0, 13.0, 14.0, 21.0, 28.0, 49.0, 52.0, 106.0, 198.0, 402.0, 1058.0, 3140.0, 11705.0, 58872.0, 480769.0, 423699.0, 53173.0, 10516.0, 2949.0, 949.0, 385.0, 173.0, 86.0, 49.0, 46.0, 20.0, 25.0, 15.0, 5.0, 5.0, 7.0, 5.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.181640625, -2.1036376953125, -2.025634765625, -1.9476318359375, -1.86962890625, -1.7916259765625, -1.713623046875, -1.6356201171875, -1.5576171875, -1.4796142578125, -1.401611328125, -1.3236083984375, -1.24560546875, -1.1676025390625, -1.089599609375, -1.0115966796875, -0.93359375, -0.8555908203125, -0.777587890625, -0.6995849609375, -0.62158203125, -0.5435791015625, -0.465576171875, -0.3875732421875, -0.3095703125, -0.2315673828125, -0.153564453125, -0.0755615234375, 0.00244140625, 0.0804443359375, 0.158447265625, 0.2364501953125, 0.314453125, 0.3924560546875, 0.470458984375, 0.5484619140625, 0.62646484375, 0.7044677734375, 0.782470703125, 0.8604736328125, 0.9384765625, 1.0164794921875, 1.094482421875, 1.1724853515625, 1.25048828125, 1.3284912109375, 1.406494140625, 1.4844970703125, 1.5625, 1.6405029296875, 1.718505859375, 1.7965087890625, 1.87451171875, 1.9525146484375, 2.030517578125, 2.1085205078125, 2.1865234375, 2.2645263671875, 2.342529296875, 2.4205322265625, 2.49853515625, 2.5765380859375, 2.654541015625, 2.7325439453125, 2.810546875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 9.0, 22.0, 29.0, 60.0, 106.0, 137.0, 163.0, 156.0, 111.0, 85.0, 54.0, 31.0, 22.0, 11.0, 9.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.191650390625, -0.18101119995117188, -0.17037200927734375, -0.15973281860351562, -0.1490936279296875, -0.13845443725585938, -0.12781524658203125, -0.11717605590820312, -0.106536865234375, -0.09589767456054688, -0.08525848388671875, -0.07461929321289062, -0.0639801025390625, -0.053340911865234375, -0.04270172119140625, -0.032062530517578125, -0.02142333984375, -0.010784149169921875, -0.00014495849609375, 0.010494232177734375, 0.0211334228515625, 0.031772613525390625, 0.04241180419921875, 0.053050994873046875, 0.063690185546875, 0.07432937622070312, 0.08496856689453125, 0.09560775756835938, 0.1062469482421875, 0.11688613891601562, 0.12752532958984375, 0.13816452026367188, 0.1488037109375, 0.15944290161132812, 0.17008209228515625, 0.18072128295898438, 0.1913604736328125, 0.20199966430664062, 0.21263885498046875, 0.22327804565429688, 0.233917236328125, 0.24455642700195312, 0.25519561767578125, 0.2658348083496094, 0.2764739990234375, 0.2871131896972656, 0.29775238037109375, 0.3083915710449219, 0.31903076171875, 0.3296699523925781, 0.34030914306640625, 0.3509483337402344, 0.3615875244140625, 0.3722267150878906, 0.38286590576171875, 0.3935050964355469, 0.404144287109375, 0.4147834777832031, 0.42542266845703125, 0.4360618591308594, 0.4467010498046875, 0.4573402404785156, 0.46797943115234375, 0.4786186218261719, 0.4892578125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 15.0, 9.0, 22.0, 26.0, 48.0, 74.0, 89.0, 146.0, 226.0, 347.0, 564.0, 982.0, 1666.0, 2970.0, 5254.0, 10132.0, 20244.0, 41817.0, 90987.0, 205547.0, 316136.0, 187598.0, 83783.0, 38536.0, 18774.0, 9984.0, 5250.0, 2988.0, 1642.0, 969.0, 614.0, 381.0, 254.0, 155.0, 94.0, 72.0, 47.0, 27.0, 25.0, 20.0, 13.0, 8.0, 3.0, 9.0, 3.0, 0.0, 3.0, 3.0], "bins": [-1.185546875, -1.15301513671875, -1.1204833984375, -1.08795166015625, -1.055419921875, -1.02288818359375, -0.9903564453125, -0.95782470703125, -0.92529296875, -0.89276123046875, -0.8602294921875, -0.82769775390625, -0.795166015625, -0.76263427734375, -0.7301025390625, -0.69757080078125, -0.6650390625, -0.63250732421875, -0.5999755859375, -0.56744384765625, -0.534912109375, -0.50238037109375, -0.4698486328125, -0.43731689453125, -0.40478515625, -0.37225341796875, -0.3397216796875, -0.30718994140625, -0.274658203125, -0.24212646484375, -0.2095947265625, -0.17706298828125, -0.14453125, -0.11199951171875, -0.0794677734375, -0.04693603515625, -0.014404296875, 0.01812744140625, 0.0506591796875, 0.08319091796875, 0.11572265625, 0.14825439453125, 0.1807861328125, 0.21331787109375, 0.245849609375, 0.27838134765625, 0.3109130859375, 0.34344482421875, 0.3759765625, 0.40850830078125, 0.4410400390625, 0.47357177734375, 0.506103515625, 0.53863525390625, 0.5711669921875, 0.60369873046875, 0.63623046875, 0.66876220703125, 0.7012939453125, 0.73382568359375, 0.766357421875, 0.79888916015625, 0.8314208984375, 0.86395263671875, 0.896484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 0.0, 6.0, 8.0, 6.0, 2.0, 4.0, 6.0, 12.0, 13.0, 7.0, 16.0, 23.0, 16.0, 17.0, 27.0, 35.0, 32.0, 27.0, 29.0, 39.0, 38.0, 46.0, 38.0, 40.0, 37.0, 35.0, 28.0, 32.0, 31.0, 35.0, 33.0, 25.0, 31.0, 29.0, 25.0, 22.0, 22.0, 19.0, 15.0, 19.0, 10.0, 9.0, 18.0, 9.0, 12.0, 6.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.57763671875, -0.5574569702148438, -0.5372772216796875, -0.5170974731445312, -0.496917724609375, -0.47673797607421875, -0.4565582275390625, -0.43637847900390625, -0.41619873046875, -0.39601898193359375, -0.3758392333984375, -0.35565948486328125, -0.335479736328125, -0.31529998779296875, -0.2951202392578125, -0.27494049072265625, -0.2547607421875, -0.23458099365234375, -0.2144012451171875, -0.19422149658203125, -0.174041748046875, -0.15386199951171875, -0.1336822509765625, -0.11350250244140625, -0.09332275390625, -0.07314300537109375, -0.0529632568359375, -0.03278350830078125, -0.012603759765625, 0.00757598876953125, 0.0277557373046875, 0.04793548583984375, 0.068115234375, 0.08829498291015625, 0.1084747314453125, 0.12865447998046875, 0.148834228515625, 0.16901397705078125, 0.1891937255859375, 0.20937347412109375, 0.22955322265625, 0.24973297119140625, 0.2699127197265625, 0.29009246826171875, 0.310272216796875, 0.33045196533203125, 0.3506317138671875, 0.37081146240234375, 0.3909912109375, 0.41117095947265625, 0.4313507080078125, 0.45153045654296875, 0.471710205078125, 0.49188995361328125, 0.5120697021484375, 0.5322494506835938, 0.55242919921875, 0.5726089477539062, 0.5927886962890625, 0.6129684448242188, 0.633148193359375, 0.6533279418945312, 0.6735076904296875, 0.6936874389648438, 0.7138671875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 18.0, 9.0, 19.0, 21.0, 19.0, 24.0, 44.0, 72.0, 142.0, 327.0, 691.0, 1865.0, 4941.0, 20442.0, 220496.0, 732072.0, 52839.0, 9471.0, 2841.0, 1120.0, 477.0, 237.0, 129.0, 63.0, 41.0, 33.0, 23.0, 15.0, 9.0, 9.0, 8.0, 5.0, 7.0, 4.0, 3.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.708984375, -2.622283935546875, -2.53558349609375, -2.448883056640625, -2.3621826171875, -2.275482177734375, -2.18878173828125, -2.102081298828125, -2.015380859375, -1.928680419921875, -1.84197998046875, -1.755279541015625, -1.6685791015625, -1.581878662109375, -1.49517822265625, -1.408477783203125, -1.32177734375, -1.235076904296875, -1.14837646484375, -1.061676025390625, -0.9749755859375, -0.888275146484375, -0.80157470703125, -0.714874267578125, -0.628173828125, -0.541473388671875, -0.45477294921875, -0.368072509765625, -0.2813720703125, -0.194671630859375, -0.10797119140625, -0.021270751953125, 0.0654296875, 0.152130126953125, 0.23883056640625, 0.325531005859375, 0.4122314453125, 0.498931884765625, 0.58563232421875, 0.672332763671875, 0.759033203125, 0.845733642578125, 0.93243408203125, 1.019134521484375, 1.1058349609375, 1.192535400390625, 1.27923583984375, 1.365936279296875, 1.45263671875, 1.539337158203125, 1.62603759765625, 1.712738037109375, 1.7994384765625, 1.886138916015625, 1.97283935546875, 2.059539794921875, 2.146240234375, 2.232940673828125, 2.31964111328125, 2.406341552734375, 2.4930419921875, 2.579742431640625, 2.66644287109375, 2.753143310546875, 2.83984375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 2.0, 4.0, 7.0, 14.0, 10.0, 27.0, 30.0, 42.0, 64.0, 105.0, 121.0, 135.0, 117.0, 95.0, 64.0, 53.0, 28.0, 19.0, 10.0, 17.0, 7.0, 9.0, 3.0, 4.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00024700164794921875, -0.00024004653096199036, -0.00023309141397476196, -0.00022613629698753357, -0.00021918118000030518, -0.00021222606301307678, -0.0002052709460258484, -0.00019831582903862, -0.0001913607120513916, -0.0001844055950641632, -0.00017745047807693481, -0.00017049536108970642, -0.00016354024410247803, -0.00015658512711524963, -0.00014963001012802124, -0.00014267489314079285, -0.00013571977615356445, -0.00012876465916633606, -0.00012180954217910767, -0.00011485442519187927, -0.00010789930820465088, -0.00010094419121742249, -9.398907423019409e-05, -8.70339572429657e-05, -8.00788402557373e-05, -7.312372326850891e-05, -6.616860628128052e-05, -5.9213489294052124e-05, -5.225837230682373e-05, -4.530325531959534e-05, -3.834813833236694e-05, -3.139302134513855e-05, -2.4437904357910156e-05, -1.7482787370681763e-05, -1.0527670383453369e-05, -3.5725533962249756e-06, 3.382563591003418e-06, 1.0337680578231812e-05, 1.7292797565460205e-05, 2.42479145526886e-05, 3.120303153991699e-05, 3.8158148527145386e-05, 4.511326551437378e-05, 5.206838250160217e-05, 5.9023499488830566e-05, 6.597861647605896e-05, 7.293373346328735e-05, 7.988885045051575e-05, 8.684396743774414e-05, 9.379908442497253e-05, 0.00010075420141220093, 0.00010770931839942932, 0.00011466443538665771, 0.00012161955237388611, 0.0001285746693611145, 0.0001355297863483429, 0.0001424849033355713, 0.00014944002032279968, 0.00015639513731002808, 0.00016335025429725647, 0.00017030537128448486, 0.00017726048827171326, 0.00018421560525894165, 0.00019117072224617004, 0.00019812583923339844]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 10.0, 13.0, 24.0, 31.0, 47.0, 85.0, 191.0, 502.0, 1816.0, 9274.0, 811122.0, 217274.0, 6144.0, 1323.0, 407.0, 131.0, 59.0, 35.0, 23.0, 18.0, 5.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0], "bins": [-12.546875, -12.2674560546875, -11.988037109375, -11.7086181640625, -11.42919921875, -11.1497802734375, -10.870361328125, -10.5909423828125, -10.3115234375, -10.0321044921875, -9.752685546875, -9.4732666015625, -9.19384765625, -8.9144287109375, -8.635009765625, -8.3555908203125, -8.076171875, -7.7967529296875, -7.517333984375, -7.2379150390625, -6.95849609375, -6.6790771484375, -6.399658203125, -6.1202392578125, -5.8408203125, -5.5614013671875, -5.281982421875, -5.0025634765625, -4.72314453125, -4.4437255859375, -4.164306640625, -3.8848876953125, -3.60546875, -3.3260498046875, -3.046630859375, -2.7672119140625, -2.48779296875, -2.2083740234375, -1.928955078125, -1.6495361328125, -1.3701171875, -1.0906982421875, -0.811279296875, -0.5318603515625, -0.25244140625, 0.0269775390625, 0.306396484375, 0.5858154296875, 0.865234375, 1.1446533203125, 1.424072265625, 1.7034912109375, 1.98291015625, 2.2623291015625, 2.541748046875, 2.8211669921875, 3.1005859375, 3.3800048828125, 3.659423828125, 3.9388427734375, 4.21826171875, 4.4976806640625, 4.777099609375, 5.0565185546875, 5.3359375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 4.0, 3.0, 4.0, 11.0, 7.0, 11.0, 20.0, 23.0, 44.0, 205.0, 307.0, 207.0, 73.0, 30.0, 18.0, 11.0, 8.0, 10.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.78515625, -3.698089599609375, -3.61102294921875, -3.523956298828125, -3.4368896484375, -3.349822998046875, -3.26275634765625, -3.175689697265625, -3.088623046875, -3.001556396484375, -2.91448974609375, -2.827423095703125, -2.7403564453125, -2.653289794921875, -2.56622314453125, -2.479156494140625, -2.39208984375, -2.305023193359375, -2.21795654296875, -2.130889892578125, -2.0438232421875, -1.956756591796875, -1.86968994140625, -1.782623291015625, -1.695556640625, -1.608489990234375, -1.52142333984375, -1.434356689453125, -1.3472900390625, -1.260223388671875, -1.17315673828125, -1.086090087890625, -0.9990234375, -0.911956787109375, -0.82489013671875, -0.737823486328125, -0.6507568359375, -0.563690185546875, -0.47662353515625, -0.389556884765625, -0.302490234375, -0.215423583984375, -0.12835693359375, -0.041290283203125, 0.0457763671875, 0.132843017578125, 0.21990966796875, 0.306976318359375, 0.39404296875, 0.481109619140625, 0.56817626953125, 0.655242919921875, 0.7423095703125, 0.829376220703125, 0.91644287109375, 1.003509521484375, 1.090576171875, 1.177642822265625, 1.26470947265625, 1.351776123046875, 1.4388427734375, 1.525909423828125, 1.61297607421875, 1.700042724609375, 1.787109375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 3.0, 11.0, 29.0, 87.0, 278.0, 409.0, 153.0, 25.0, 9.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.718629837036133, -18.506650924682617, -17.2946720123291, -16.082693099975586, -14.87071418762207, -13.658735275268555, -12.446755409240723, -11.234776496887207, -10.022797584533691, -8.810818672180176, -7.59883975982666, -6.386860370635986, -5.174881458282471, -3.962902545928955, -2.7509231567382812, -1.5389442443847656, -0.32696533203125, 0.8850136995315552, 2.0969927310943604, 3.308971881866455, 4.520950794219971, 5.732929706573486, 6.94490909576416, 8.156888008117676, 9.368866920471191, 10.580845832824707, 11.792824745178223, 13.004804611206055, 14.21678352355957, 15.428762435913086, 16.6407413482666, 17.852720260620117, 19.064701080322266, 20.27667999267578, 21.488658905029297, 22.700637817382812, 23.912616729736328, 25.124595642089844, 26.33657455444336, 27.548553466796875, 28.76053237915039, 29.972511291503906, 31.184490203857422, 32.39646911621094, 33.60844802856445, 34.82042694091797, 36.032405853271484, 37.244384765625, 38.45636749267578, 39.6683464050293, 40.88032531738281, 42.09230422973633, 43.304283142089844, 44.51626205444336, 45.728240966796875, 46.94021987915039, 48.152198791503906, 49.36417770385742, 50.57615661621094, 51.78813552856445, 53.00011444091797, 54.212093353271484, 55.424072265625, 56.636051177978516, 57.84803009033203]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 3.0, 5.0, 8.0, 16.0, 28.0, 46.0, 80.0, 80.0, 108.0, 127.0, 143.0, 98.0, 90.0, 76.0, 49.0, 29.0, 11.0, 12.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.699911594390869, -5.1720476150512695, -4.64418363571167, -4.11631965637207, -3.58845591545105, -3.06059193611145, -2.5327281951904297, -2.00486421585083, -1.4770002365112305, -0.9491363167762756, -0.4212723970413208, 0.10659146308898926, 0.6344554424285889, 1.1623194217681885, 1.690183162689209, 2.2180471420288086, 2.745911121368408, 3.273775100708008, 3.8016390800476074, 4.329503059387207, 4.857366561889648, 5.385231018066406, 5.913094520568848, 6.440958499908447, 6.968822479248047, 7.4966864585876465, 8.024550437927246, 8.552413940429688, 9.080278396606445, 9.608141899108887, 10.136005401611328, 10.663869857788086, 11.191732406616211, 11.719595909118652, 12.24746036529541, 12.775323867797852, 13.30318832397461, 13.83105182647705, 14.358915328979492, 14.88677978515625, 15.414644241333008, 15.94250774383545, 16.47037124633789, 16.99823570251465, 17.526100158691406, 18.053964614868164, 18.58182716369629, 19.109691619873047, 19.637554168701172, 20.16541862487793, 20.693281173706055, 21.221145629882812, 21.74901008605957, 22.276874542236328, 22.804737091064453, 23.33260154724121, 23.86046600341797, 24.388330459594727, 24.91619300842285, 25.44405746459961, 25.971921920776367, 26.499786376953125, 27.02764892578125, 27.555513381958008, 28.083377838134766]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 17.0, 25.0, 47.0, 111.0, 386.0, 2875.0, 279460.0, 3905627.0, 4673.0, 647.0, 213.0, 96.0, 49.0, 24.0, 14.0, 7.0, 9.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4140625, -10.8155517578125, -10.217041015625, -9.6185302734375, -9.02001953125, -8.4215087890625, -7.822998046875, -7.2244873046875, -6.6259765625, -6.0274658203125, -5.428955078125, -4.8304443359375, -4.23193359375, -3.6334228515625, -3.034912109375, -2.4364013671875, -1.837890625, -1.2393798828125, -0.640869140625, -0.0423583984375, 0.55615234375, 1.1546630859375, 1.753173828125, 2.3516845703125, 2.9501953125, 3.5487060546875, 4.147216796875, 4.7457275390625, 5.34423828125, 5.9427490234375, 6.541259765625, 7.1397705078125, 7.73828125, 8.3367919921875, 8.935302734375, 9.5338134765625, 10.13232421875, 10.7308349609375, 11.329345703125, 11.9278564453125, 12.5263671875, 13.1248779296875, 13.723388671875, 14.3218994140625, 14.92041015625, 15.5189208984375, 16.117431640625, 16.7159423828125, 17.314453125, 17.9129638671875, 18.511474609375, 19.1099853515625, 19.70849609375, 20.3070068359375, 20.905517578125, 21.5040283203125, 22.1025390625, 22.7010498046875, 23.299560546875, 23.8980712890625, 24.49658203125, 25.0950927734375, 25.693603515625, 26.2921142578125, 26.890625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 14.0, 18.0, 37.0, 69.0, 97.0, 140.0, 149.0, 158.0, 111.0, 90.0, 64.0, 27.0, 16.0, 5.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.281982421875, -0.2661781311035156, -0.25037384033203125, -0.23456954956054688, -0.2187652587890625, -0.20296096801757812, -0.18715667724609375, -0.17135238647460938, -0.155548095703125, -0.13974380493164062, -0.12393951416015625, -0.10813522338867188, -0.0923309326171875, -0.07652664184570312, -0.06072235107421875, -0.044918060302734375, -0.02911376953125, -0.013309478759765625, 0.00249481201171875, 0.018299102783203125, 0.0341033935546875, 0.049907684326171875, 0.06571197509765625, 0.08151626586914062, 0.097320556640625, 0.11312484741210938, 0.12892913818359375, 0.14473342895507812, 0.1605377197265625, 0.17634201049804688, 0.19214630126953125, 0.20795059204101562, 0.2237548828125, 0.23955917358398438, 0.25536346435546875, 0.2711677551269531, 0.2869720458984375, 0.3027763366699219, 0.31858062744140625, 0.3343849182128906, 0.350189208984375, 0.3659934997558594, 0.38179779052734375, 0.3976020812988281, 0.4134063720703125, 0.4292106628417969, 0.44501495361328125, 0.4608192443847656, 0.47662353515625, 0.4924278259277344, 0.5082321166992188, 0.5240364074707031, 0.5398406982421875, 0.5556449890136719, 0.5714492797851562, 0.5872535705566406, 0.603057861328125, 0.6188621520996094, 0.6346664428710938, 0.6504707336425781, 0.6662750244140625, 0.6820793151855469, 0.6978836059570312, 0.7136878967285156, 0.7294921875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 9.0, 9.0, 14.0, 25.0, 40.0, 59.0, 77.0, 147.0, 277.0, 1577.0, 98730.0, 4084069.0, 8120.0, 472.0, 185.0, 144.0, 115.0, 76.0, 52.0, 38.0, 18.0, 17.0, 12.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2578125, -12.7325439453125, -12.207275390625, -11.6820068359375, -11.15673828125, -10.6314697265625, -10.106201171875, -9.5809326171875, -9.0556640625, -8.5303955078125, -8.005126953125, -7.4798583984375, -6.95458984375, -6.4293212890625, -5.904052734375, -5.3787841796875, -4.853515625, -4.3282470703125, -3.802978515625, -3.2777099609375, -2.75244140625, -2.2271728515625, -1.701904296875, -1.1766357421875, -0.6513671875, -0.1260986328125, 0.399169921875, 0.9244384765625, 1.44970703125, 1.9749755859375, 2.500244140625, 3.0255126953125, 3.55078125, 4.0760498046875, 4.601318359375, 5.1265869140625, 5.65185546875, 6.1771240234375, 6.702392578125, 7.2276611328125, 7.7529296875, 8.2781982421875, 8.803466796875, 9.3287353515625, 9.85400390625, 10.3792724609375, 10.904541015625, 11.4298095703125, 11.955078125, 12.4803466796875, 13.005615234375, 13.5308837890625, 14.05615234375, 14.5814208984375, 15.106689453125, 15.6319580078125, 16.1572265625, 16.6824951171875, 17.207763671875, 17.7330322265625, 18.25830078125, 18.7835693359375, 19.308837890625, 19.8341064453125, 20.359375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 9.0, 20.0, 36.0, 73.0, 229.0, 3144.0, 422.0, 83.0, 38.0, 27.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96923828125, -0.8983078002929688, -0.8273773193359375, -0.7564468383789062, -0.685516357421875, -0.6145858764648438, -0.5436553955078125, -0.47272491455078125, -0.40179443359375, -0.33086395263671875, -0.2599334716796875, -0.18900299072265625, -0.118072509765625, -0.04714202880859375, 0.0237884521484375, 0.09471893310546875, 0.1656494140625, 0.23657989501953125, 0.3075103759765625, 0.37844085693359375, 0.449371337890625, 0.5203018188476562, 0.5912322998046875, 0.6621627807617188, 0.73309326171875, 0.8040237426757812, 0.8749542236328125, 0.9458847045898438, 1.016815185546875, 1.0877456665039062, 1.1586761474609375, 1.2296066284179688, 1.300537109375, 1.3714675903320312, 1.4423980712890625, 1.5133285522460938, 1.584259033203125, 1.6551895141601562, 1.7261199951171875, 1.7970504760742188, 1.86798095703125, 1.9389114379882812, 2.0098419189453125, 2.0807723999023438, 2.151702880859375, 2.2226333618164062, 2.2935638427734375, 2.3644943237304688, 2.4354248046875, 2.5063552856445312, 2.5772857666015625, 2.6482162475585938, 2.719146728515625, 2.7900772094726562, 2.8610076904296875, 2.9319381713867188, 3.00286865234375, 3.0737991333007812, 3.1447296142578125, 3.2156600952148438, 3.286590576171875, 3.3575210571289062, 3.4284515380859375, 3.4993820190429688, 3.5703125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 2.0, 4.0, 9.0, 25.0, 137.0, 500.0, 279.0, 41.0, 10.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.370308876037598, -3.716674566268921, -3.063040256500244, -2.4094061851501465, -1.7557718753814697, -1.102137565612793, -0.4485034942626953, 0.20513105392456055, 0.8587651252746582, 1.512399435043335, 2.1660337448120117, 2.8196678161621094, 3.473302125930786, 4.126936435699463, 4.7805705070495605, 5.434205055236816, 6.087839126586914, 6.741473197937012, 7.395107746124268, 8.048742294311523, 8.702376365661621, 9.356010437011719, 10.009644508361816, 10.663278579711914, 11.316913604736328, 11.970547676086426, 12.624181747436523, 13.277816772460938, 13.931450843811035, 14.585084915161133, 15.23871898651123, 15.892353057861328, 16.545988082885742, 17.199623107910156, 17.853256225585938, 18.50689125061035, 19.160524368286133, 19.814159393310547, 20.467792510986328, 21.121427536010742, 21.775062561035156, 22.42869758605957, 23.08233070373535, 23.735965728759766, 24.389598846435547, 25.04323387145996, 25.696868896484375, 26.350502014160156, 27.004135131835938, 27.65777015686035, 28.311403274536133, 28.965038299560547, 29.618671417236328, 30.272306442260742, 30.925941467285156, 31.579574584960938, 32.233211517333984, 32.886844635009766, 33.54048156738281, 34.194114685058594, 34.847747802734375, 35.501380920410156, 36.1550178527832, 36.808650970458984, 37.462284088134766]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 8.0, 19.0, 26.0, 56.0, 72.0, 115.0, 136.0, 139.0, 149.0, 101.0, 76.0, 55.0, 27.0, 16.0, 6.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.678271293640137, -12.310083389282227, -11.94189453125, -11.57370662689209, -11.205517768859863, -10.837329864501953, -10.469141006469727, -10.100953102111816, -9.732765197753906, -9.364577293395996, -8.99638843536377, -8.62820053100586, -8.260011672973633, -7.891823768615723, -7.523635387420654, -7.155447006225586, -6.787258148193359, -6.419069766998291, -6.050881385803223, -5.6826934814453125, -5.314504623413086, -4.946316719055176, -4.578128337860107, -4.209939956665039, -3.8417515754699707, -3.4735631942749023, -3.105374813079834, -2.7371866703033447, -2.3689982891082764, -2.000809907913208, -1.6326217651367188, -1.2644333839416504, -0.896245002746582, -0.5280566811561584, -0.15986835956573486, 0.20831990242004395, 0.5765082836151123, 0.9446966648101807, 1.31288480758667, 1.6810731887817383, 2.0492615699768066, 2.417449951171875, 2.7856383323669434, 3.1538264751434326, 3.522014856338501, 3.8902032375335693, 4.258391380310059, 4.626579761505127, 4.994768142700195, 5.362956523895264, 5.731144905090332, 6.099332809448242, 6.467521667480469, 6.835709571838379, 7.203897953033447, 7.572086334228516, 7.940274715423584, 8.308463096618652, 8.676651000976562, 9.044839859008789, 9.4130277633667, 9.781216621398926, 10.149404525756836, 10.517593383789062, 10.885781288146973]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 10.0, 10.0, 13.0, 10.0, 29.0, 32.0, 52.0, 83.0, 114.0, 261.0, 602.0, 1615.0, 5762.0, 34837.0, 373204.0, 567276.0, 53456.0, 7800.0, 1946.0, 733.0, 315.0, 135.0, 93.0, 59.0, 25.0, 22.0, 18.0, 13.0, 8.0, 6.0, 2.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.171875, -5.02020263671875, -4.8685302734375, -4.71685791015625, -4.565185546875, -4.41351318359375, -4.2618408203125, -4.11016845703125, -3.95849609375, -3.80682373046875, -3.6551513671875, -3.50347900390625, -3.351806640625, -3.20013427734375, -3.0484619140625, -2.89678955078125, -2.7451171875, -2.59344482421875, -2.4417724609375, -2.29010009765625, -2.138427734375, -1.98675537109375, -1.8350830078125, -1.68341064453125, -1.53173828125, -1.38006591796875, -1.2283935546875, -1.07672119140625, -0.925048828125, -0.77337646484375, -0.6217041015625, -0.47003173828125, -0.318359375, -0.16668701171875, -0.0150146484375, 0.13665771484375, 0.288330078125, 0.44000244140625, 0.5916748046875, 0.74334716796875, 0.89501953125, 1.04669189453125, 1.1983642578125, 1.35003662109375, 1.501708984375, 1.65338134765625, 1.8050537109375, 1.95672607421875, 2.1083984375, 2.26007080078125, 2.4117431640625, 2.56341552734375, 2.715087890625, 2.86676025390625, 3.0184326171875, 3.17010498046875, 3.32177734375, 3.47344970703125, 3.6251220703125, 3.77679443359375, 3.928466796875, 4.08013916015625, 4.2318115234375, 4.38348388671875, 4.53515625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 0.0, 10.0, 13.0, 28.0, 43.0, 89.0, 118.0, 151.0, 150.0, 130.0, 82.0, 61.0, 56.0, 36.0, 22.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.35791015625, -0.33626556396484375, -0.3146209716796875, -0.29297637939453125, -0.271331787109375, -0.24968719482421875, -0.2280426025390625, -0.20639801025390625, -0.18475341796875, -0.16310882568359375, -0.1414642333984375, -0.11981964111328125, -0.098175048828125, -0.07653045654296875, -0.0548858642578125, -0.03324127197265625, -0.0115966796875, 0.01004791259765625, 0.0316925048828125, 0.05333709716796875, 0.074981689453125, 0.09662628173828125, 0.1182708740234375, 0.13991546630859375, 0.16156005859375, 0.18320465087890625, 0.2048492431640625, 0.22649383544921875, 0.248138427734375, 0.26978302001953125, 0.2914276123046875, 0.31307220458984375, 0.334716796875, 0.35636138916015625, 0.3780059814453125, 0.39965057373046875, 0.421295166015625, 0.44293975830078125, 0.4645843505859375, 0.48622894287109375, 0.50787353515625, 0.5295181274414062, 0.5511627197265625, 0.5728073120117188, 0.594451904296875, 0.6160964965820312, 0.6377410888671875, 0.6593856811523438, 0.6810302734375, 0.7026748657226562, 0.7243194580078125, 0.7459640502929688, 0.767608642578125, 0.7892532348632812, 0.8108978271484375, 0.8325424194335938, 0.85418701171875, 0.8758316040039062, 0.8974761962890625, 0.9191207885742188, 0.940765380859375, 0.9624099731445312, 0.9840545654296875, 1.0056991577148438, 1.02734375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 2.0, 6.0, 6.0, 9.0, 8.0, 14.0, 24.0, 29.0, 42.0, 62.0, 98.0, 149.0, 224.0, 380.0, 633.0, 1229.0, 2731.0, 6632.0, 17859.0, 56476.0, 221564.0, 505593.0, 165508.0, 44209.0, 14527.0, 5514.0, 2371.0, 1139.0, 568.0, 326.0, 198.0, 126.0, 84.0, 68.0, 42.0, 30.0, 19.0, 16.0, 15.0, 9.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.197265625, -2.12945556640625, -2.0616455078125, -1.99383544921875, -1.926025390625, -1.85821533203125, -1.7904052734375, -1.72259521484375, -1.65478515625, -1.58697509765625, -1.5191650390625, -1.45135498046875, -1.383544921875, -1.31573486328125, -1.2479248046875, -1.18011474609375, -1.1123046875, -1.04449462890625, -0.9766845703125, -0.90887451171875, -0.841064453125, -0.77325439453125, -0.7054443359375, -0.63763427734375, -0.56982421875, -0.50201416015625, -0.4342041015625, -0.36639404296875, -0.298583984375, -0.23077392578125, -0.1629638671875, -0.09515380859375, -0.02734375, 0.04046630859375, 0.1082763671875, 0.17608642578125, 0.243896484375, 0.31170654296875, 0.3795166015625, 0.44732666015625, 0.51513671875, 0.58294677734375, 0.6507568359375, 0.71856689453125, 0.786376953125, 0.85418701171875, 0.9219970703125, 0.98980712890625, 1.0576171875, 1.12542724609375, 1.1932373046875, 1.26104736328125, 1.328857421875, 1.39666748046875, 1.4644775390625, 1.53228759765625, 1.60009765625, 1.66790771484375, 1.7357177734375, 1.80352783203125, 1.871337890625, 1.93914794921875, 2.0069580078125, 2.07476806640625, 2.142578125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 7.0, 12.0, 7.0, 5.0, 10.0, 13.0, 17.0, 17.0, 32.0, 25.0, 27.0, 37.0, 29.0, 52.0, 45.0, 56.0, 48.0, 58.0, 45.0, 71.0, 49.0, 41.0, 42.0, 38.0, 36.0, 24.0, 21.0, 30.0, 21.0, 17.0, 12.0, 13.0, 7.0, 11.0, 7.0, 5.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3828125, -1.339996337890625, -1.29718017578125, -1.254364013671875, -1.2115478515625, -1.168731689453125, -1.12591552734375, -1.083099365234375, -1.040283203125, -0.997467041015625, -0.95465087890625, -0.911834716796875, -0.8690185546875, -0.826202392578125, -0.78338623046875, -0.740570068359375, -0.69775390625, -0.654937744140625, -0.61212158203125, -0.569305419921875, -0.5264892578125, -0.483673095703125, -0.44085693359375, -0.398040771484375, -0.355224609375, -0.312408447265625, -0.26959228515625, -0.226776123046875, -0.1839599609375, -0.141143798828125, -0.09832763671875, -0.055511474609375, -0.0126953125, 0.030120849609375, 0.07293701171875, 0.115753173828125, 0.1585693359375, 0.201385498046875, 0.24420166015625, 0.287017822265625, 0.329833984375, 0.372650146484375, 0.41546630859375, 0.458282470703125, 0.5010986328125, 0.543914794921875, 0.58673095703125, 0.629547119140625, 0.67236328125, 0.715179443359375, 0.75799560546875, 0.800811767578125, 0.8436279296875, 0.886444091796875, 0.92926025390625, 0.972076416015625, 1.014892578125, 1.057708740234375, 1.10052490234375, 1.143341064453125, 1.1861572265625, 1.228973388671875, 1.27178955078125, 1.314605712890625, 1.357421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 9.0, 15.0, 23.0, 41.0, 68.0, 153.0, 400.0, 1879.0, 29457.0, 998055.0, 16451.0, 1397.0, 316.0, 131.0, 74.0, 40.0, 18.0, 9.0, 7.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.640625, -8.4320068359375, -8.223388671875, -8.0147705078125, -7.80615234375, -7.5975341796875, -7.388916015625, -7.1802978515625, -6.9716796875, -6.7630615234375, -6.554443359375, -6.3458251953125, -6.13720703125, -5.9285888671875, -5.719970703125, -5.5113525390625, -5.302734375, -5.0941162109375, -4.885498046875, -4.6768798828125, -4.46826171875, -4.2596435546875, -4.051025390625, -3.8424072265625, -3.6337890625, -3.4251708984375, -3.216552734375, -3.0079345703125, -2.79931640625, -2.5906982421875, -2.382080078125, -2.1734619140625, -1.96484375, -1.7562255859375, -1.547607421875, -1.3389892578125, -1.13037109375, -0.9217529296875, -0.713134765625, -0.5045166015625, -0.2958984375, -0.0872802734375, 0.121337890625, 0.3299560546875, 0.53857421875, 0.7471923828125, 0.955810546875, 1.1644287109375, 1.373046875, 1.5816650390625, 1.790283203125, 1.9989013671875, 2.20751953125, 2.4161376953125, 2.624755859375, 2.8333740234375, 3.0419921875, 3.2506103515625, 3.459228515625, 3.6678466796875, 3.87646484375, 4.0850830078125, 4.293701171875, 4.5023193359375, 4.7109375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 6.0, 5.0, 8.0, 7.0, 15.0, 14.0, 23.0, 40.0, 70.0, 75.0, 112.0, 110.0, 149.0, 113.0, 75.0, 55.0, 33.0, 22.0, 25.0, 9.0, 10.0, 9.0, 9.0, 1.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015783309936523438, -0.00015094876289367676, -0.00014406442642211914, -0.00013718008995056152, -0.0001302957534790039, -0.0001234114170074463, -0.00011652708053588867, -0.00010964274406433105, -0.00010275840759277344, -9.587407112121582e-05, -8.89897346496582e-05, -8.210539817810059e-05, -7.522106170654297e-05, -6.833672523498535e-05, -6.145238876342773e-05, -5.456805229187012e-05, -4.76837158203125e-05, -4.079937934875488e-05, -3.3915042877197266e-05, -2.703070640563965e-05, -2.014636993408203e-05, -1.3262033462524414e-05, -6.377696990966797e-06, 5.066394805908203e-07, 7.3909759521484375e-06, 1.4275312423706055e-05, 2.1159648895263672e-05, 2.804398536682129e-05, 3.4928321838378906e-05, 4.1812658309936523e-05, 4.869699478149414e-05, 5.558133125305176e-05, 6.246566772460938e-05, 6.935000419616699e-05, 7.623434066772461e-05, 8.311867713928223e-05, 9.000301361083984e-05, 9.688735008239746e-05, 0.00010377168655395508, 0.0001106560230255127, 0.00011754035949707031, 0.00012442469596862793, 0.00013130903244018555, 0.00013819336891174316, 0.00014507770538330078, 0.0001519620418548584, 0.00015884637832641602, 0.00016573071479797363, 0.00017261505126953125, 0.00017949938774108887, 0.00018638372421264648, 0.0001932680606842041, 0.00020015239715576172, 0.00020703673362731934, 0.00021392107009887695, 0.00022080540657043457, 0.0002276897430419922, 0.0002345740795135498, 0.00024145841598510742, 0.00024834275245666504, 0.00025522708892822266, 0.0002621114253997803, 0.0002689957618713379, 0.0002758800983428955, 0.0002827644348144531]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 4.0, 5.0, 4.0, 14.0, 7.0, 12.0, 18.0, 28.0, 42.0, 39.0, 86.0, 181.0, 370.0, 826.0, 2480.0, 7785.0, 39783.0, 721234.0, 249435.0, 18570.0, 4813.0, 1587.0, 603.0, 255.0, 119.0, 71.0, 47.0, 16.0, 24.0, 21.0, 15.0, 12.0, 12.0, 7.0, 3.0, 6.0, 7.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.912109375, -2.823333740234375, -2.73455810546875, -2.645782470703125, -2.5570068359375, -2.468231201171875, -2.37945556640625, -2.290679931640625, -2.201904296875, -2.113128662109375, -2.02435302734375, -1.935577392578125, -1.8468017578125, -1.758026123046875, -1.66925048828125, -1.580474853515625, -1.49169921875, -1.402923583984375, -1.31414794921875, -1.225372314453125, -1.1365966796875, -1.047821044921875, -0.95904541015625, -0.870269775390625, -0.781494140625, -0.692718505859375, -0.60394287109375, -0.515167236328125, -0.4263916015625, -0.337615966796875, -0.24884033203125, -0.160064697265625, -0.0712890625, 0.017486572265625, 0.10626220703125, 0.195037841796875, 0.2838134765625, 0.372589111328125, 0.46136474609375, 0.550140380859375, 0.638916015625, 0.727691650390625, 0.81646728515625, 0.905242919921875, 0.9940185546875, 1.082794189453125, 1.17156982421875, 1.260345458984375, 1.34912109375, 1.437896728515625, 1.52667236328125, 1.615447998046875, 1.7042236328125, 1.792999267578125, 1.88177490234375, 1.970550537109375, 2.059326171875, 2.148101806640625, 2.23687744140625, 2.325653076171875, 2.4144287109375, 2.503204345703125, 2.59197998046875, 2.680755615234375, 2.76953125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 1.0, 5.0, 2.0, 7.0, 4.0, 1.0, 6.0, 13.0, 11.0, 20.0, 26.0, 34.0, 48.0, 93.0, 128.0, 129.0, 116.0, 106.0, 84.0, 57.0, 36.0, 20.0, 10.0, 5.0, 9.0, 5.0, 6.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-1.2646484375, -1.229248046875, -1.19384765625, -1.158447265625, -1.123046875, -1.087646484375, -1.05224609375, -1.016845703125, -0.9814453125, -0.946044921875, -0.91064453125, -0.875244140625, -0.83984375, -0.804443359375, -0.76904296875, -0.733642578125, -0.6982421875, -0.662841796875, -0.62744140625, -0.592041015625, -0.556640625, -0.521240234375, -0.48583984375, -0.450439453125, -0.4150390625, -0.379638671875, -0.34423828125, -0.308837890625, -0.2734375, -0.238037109375, -0.20263671875, -0.167236328125, -0.1318359375, -0.096435546875, -0.06103515625, -0.025634765625, 0.009765625, 0.045166015625, 0.08056640625, 0.115966796875, 0.1513671875, 0.186767578125, 0.22216796875, 0.257568359375, 0.29296875, 0.328369140625, 0.36376953125, 0.399169921875, 0.4345703125, 0.469970703125, 0.50537109375, 0.540771484375, 0.576171875, 0.611572265625, 0.64697265625, 0.682373046875, 0.7177734375, 0.753173828125, 0.78857421875, 0.823974609375, 0.859375, 0.894775390625, 0.93017578125, 0.965576171875, 1.0009765625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 9.0, 37.0, 102.0, 380.0, 353.0, 93.0, 20.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.837528228759766, -34.55546188354492, -33.27339553833008, -31.991331100463867, -30.709264755249023, -29.42719841003418, -28.14513397216797, -26.863067626953125, -25.58100128173828, -24.298934936523438, -23.016868591308594, -21.734804153442383, -20.45273780822754, -19.170671463012695, -17.888607025146484, -16.60654067993164, -15.324474334716797, -14.042407989501953, -12.760342597961426, -11.478277206420898, -10.196210861206055, -8.914144515991211, -7.632079124450684, -6.350013732910156, -5.0679473876953125, -3.785881519317627, -2.5038156509399414, -1.2217497825622559, 0.06031608581542969, 1.3423819541931152, 2.624447822570801, 3.906513214111328, 5.188575744628906, 6.470641613006592, 7.752707481384277, 9.034772872924805, 10.316839218139648, 11.598905563354492, 12.88097095489502, 14.163036346435547, 15.44510269165039, 16.727169036865234, 18.009235382080078, 19.29129981994629, 20.573366165161133, 21.855432510375977, 23.137496948242188, 24.41956329345703, 25.701629638671875, 26.98369598388672, 28.265762329101562, 29.547826766967773, 30.829893112182617, 32.11195755004883, 33.39402389526367, 34.676090240478516, 35.95815658569336, 37.2402229309082, 38.52228927612305, 39.80435562133789, 41.08641815185547, 42.36848449707031, 43.650550842285156, 44.9326171875, 46.214683532714844]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 6.0, 6.0, 12.0, 11.0, 18.0, 18.0, 32.0, 34.0, 32.0, 45.0, 39.0, 57.0, 65.0, 64.0, 73.0, 69.0, 59.0, 61.0, 59.0, 47.0, 47.0, 25.0, 34.0, 22.0, 18.0, 21.0, 12.0, 10.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.64869213104248, -11.262978553771973, -10.877264976501465, -10.491551399230957, -10.10583782196045, -9.720124244689941, -9.33441162109375, -8.948698043823242, -8.562984466552734, -8.177270889282227, -7.791557312011719, -7.405843734741211, -7.020130157470703, -6.634416580200195, -6.248703479766846, -5.862989902496338, -5.477275848388672, -5.091562271118164, -4.705848693847656, -4.320135116577148, -3.9344217777252197, -3.548708200454712, -3.162994861602783, -2.7772812843322754, -2.3915677070617676, -2.0058541297912598, -1.6201406717300415, -1.2344272136688232, -0.8487136363983154, -0.4630000591278076, -0.0772867202758789, 0.3084268569946289, 0.6941394805908203, 1.0798530578613281, 1.4655665159225464, 1.8512799739837646, 2.2369935512542725, 2.6227071285247803, 3.008420467376709, 3.394134044647217, 3.7798476219177246, 4.165561199188232, 4.55127477645874, 4.93698787689209, 5.322701454162598, 5.7084150314331055, 6.094128608703613, 6.479842185974121, 6.865555763244629, 7.251269340515137, 7.6369829177856445, 8.022696495056152, 8.40841007232666, 8.794123649597168, 9.17983627319336, 9.565549850463867, 9.951263427734375, 10.336977005004883, 10.72269058227539, 11.108404159545898, 11.494117736816406, 11.879831314086914, 12.265544891357422, 12.65125846862793, 13.036972045898438]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 9.0, 18.0, 31.0, 89.0, 185.0, 457.0, 1203.0, 3676.0, 14241.0, 79652.0, 3818860.0, 237952.0, 27072.0, 6716.0, 2179.0, 831.0, 429.0, 229.0, 115.0, 74.0, 51.0, 40.0, 32.0, 22.0, 22.0, 16.0, 16.0, 17.0, 10.0, 5.0, 6.0, 9.0, 5.0, 5.0, 4.0, 3.0, 4.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2890625, -2.1221923828125, -1.955322265625, -1.7884521484375, -1.62158203125, -1.4547119140625, -1.287841796875, -1.1209716796875, -0.9541015625, -0.7872314453125, -0.620361328125, -0.4534912109375, -0.28662109375, -0.1197509765625, 0.047119140625, 0.2139892578125, 0.380859375, 0.5477294921875, 0.714599609375, 0.8814697265625, 1.04833984375, 1.2152099609375, 1.382080078125, 1.5489501953125, 1.7158203125, 1.8826904296875, 2.049560546875, 2.2164306640625, 2.38330078125, 2.5501708984375, 2.717041015625, 2.8839111328125, 3.05078125, 3.2176513671875, 3.384521484375, 3.5513916015625, 3.71826171875, 3.8851318359375, 4.052001953125, 4.2188720703125, 4.3857421875, 4.5526123046875, 4.719482421875, 4.8863525390625, 5.05322265625, 5.2200927734375, 5.386962890625, 5.5538330078125, 5.720703125, 5.8875732421875, 6.054443359375, 6.2213134765625, 6.38818359375, 6.5550537109375, 6.721923828125, 6.8887939453125, 7.0556640625, 7.2225341796875, 7.389404296875, 7.5562744140625, 7.72314453125, 7.8900146484375, 8.056884765625, 8.2237548828125, 8.390625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 3.0, 4.0, 5.0, 4.0, 11.0, 22.0, 34.0, 65.0, 85.0, 112.0, 124.0, 130.0, 117.0, 82.0, 82.0, 52.0, 30.0, 26.0, 14.0, 6.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2578125, -0.2371063232421875, -0.216400146484375, -0.1956939697265625, -0.17498779296875, -0.1542816162109375, -0.133575439453125, -0.1128692626953125, -0.0921630859375, -0.0714569091796875, -0.050750732421875, -0.0300445556640625, -0.00933837890625, 0.0113677978515625, 0.032073974609375, 0.0527801513671875, 0.073486328125, 0.0941925048828125, 0.114898681640625, 0.1356048583984375, 0.15631103515625, 0.1770172119140625, 0.197723388671875, 0.2184295654296875, 0.2391357421875, 0.2598419189453125, 0.280548095703125, 0.3012542724609375, 0.32196044921875, 0.3426666259765625, 0.363372802734375, 0.3840789794921875, 0.40478515625, 0.4254913330078125, 0.446197509765625, 0.4669036865234375, 0.48760986328125, 0.5083160400390625, 0.529022216796875, 0.5497283935546875, 0.5704345703125, 0.5911407470703125, 0.611846923828125, 0.6325531005859375, 0.65325927734375, 0.6739654541015625, 0.694671630859375, 0.7153778076171875, 0.736083984375, 0.7567901611328125, 0.777496337890625, 0.7982025146484375, 0.81890869140625, 0.8396148681640625, 0.860321044921875, 0.8810272216796875, 0.9017333984375, 0.9224395751953125, 0.943145751953125, 0.9638519287109375, 0.98455810546875, 1.0052642822265625, 1.025970458984375, 1.0466766357421875, 1.0673828125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 14.0, 30.0, 55.0, 170.0, 690.0, 9572.0, 4158294.0, 24102.0, 884.0, 254.0, 116.0, 53.0, 27.0, 14.0, 4.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.015625, -11.40234375, -10.7890625, -10.17578125, -9.5625, -8.94921875, -8.3359375, -7.72265625, -7.109375, -6.49609375, -5.8828125, -5.26953125, -4.65625, -4.04296875, -3.4296875, -2.81640625, -2.203125, -1.58984375, -0.9765625, -0.36328125, 0.25, 0.86328125, 1.4765625, 2.08984375, 2.703125, 3.31640625, 3.9296875, 4.54296875, 5.15625, 5.76953125, 6.3828125, 6.99609375, 7.609375, 8.22265625, 8.8359375, 9.44921875, 10.0625, 10.67578125, 11.2890625, 11.90234375, 12.515625, 13.12890625, 13.7421875, 14.35546875, 14.96875, 15.58203125, 16.1953125, 16.80859375, 17.421875, 18.03515625, 18.6484375, 19.26171875, 19.875, 20.48828125, 21.1015625, 21.71484375, 22.328125, 22.94140625, 23.5546875, 24.16796875, 24.78125, 25.39453125, 26.0078125, 26.62109375, 27.234375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 13.0, 24.0, 45.0, 81.0, 274.0, 3023.0, 421.0, 95.0, 48.0, 30.0, 10.0, 6.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.05078125, -0.983245849609375, -0.91571044921875, -0.848175048828125, -0.7806396484375, -0.713104248046875, -0.64556884765625, -0.578033447265625, -0.510498046875, -0.442962646484375, -0.37542724609375, -0.307891845703125, -0.2403564453125, -0.172821044921875, -0.10528564453125, -0.037750244140625, 0.02978515625, 0.097320556640625, 0.16485595703125, 0.232391357421875, 0.2999267578125, 0.367462158203125, 0.43499755859375, 0.502532958984375, 0.570068359375, 0.637603759765625, 0.70513916015625, 0.772674560546875, 0.8402099609375, 0.907745361328125, 0.97528076171875, 1.042816162109375, 1.1103515625, 1.177886962890625, 1.24542236328125, 1.312957763671875, 1.3804931640625, 1.448028564453125, 1.51556396484375, 1.583099365234375, 1.650634765625, 1.718170166015625, 1.78570556640625, 1.853240966796875, 1.9207763671875, 1.988311767578125, 2.05584716796875, 2.123382568359375, 2.19091796875, 2.258453369140625, 2.32598876953125, 2.393524169921875, 2.4610595703125, 2.528594970703125, 2.59613037109375, 2.663665771484375, 2.731201171875, 2.798736572265625, 2.86627197265625, 2.933807373046875, 3.0013427734375, 3.068878173828125, 3.13641357421875, 3.203948974609375, 3.271484375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 10.0, 25.0, 70.0, 245.0, 356.0, 198.0, 58.0, 24.0, 9.0, 3.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.340940475463867, -7.929718971252441, -7.518497467041016, -7.10727596282959, -6.696053981781006, -6.28483247756958, -5.873610973358154, -5.46238899230957, -5.0511674880981445, -4.639945983886719, -4.228724479675293, -3.817502737045288, -3.406280994415283, -2.9950594902038574, -2.5838379859924316, -2.1726162433624268, -1.76139497756958, -1.3501733541488647, -0.9389517903327942, -0.5277302265167236, -0.1165086030960083, 0.29471302032470703, 0.7059345245361328, 1.1171562671661377, 1.5283777713775635, 1.9395993947982788, 2.350821018218994, 2.76204252243042, 3.1732640266418457, 3.5844857692718506, 3.9957072734832764, 4.406929016113281, 4.818150520324707, 5.229372024536133, 5.640593528747559, 6.051815032958984, 6.463037014007568, 6.874258518218994, 7.28548002243042, 7.696702003479004, 8.10792350769043, 8.519145011901855, 8.930366516113281, 9.341588020324707, 9.752809524536133, 10.164031982421875, 10.575252532958984, 10.986474990844727, 11.397695541381836, 11.808917045593262, 12.220138549804688, 12.631360054016113, 13.042581558227539, 13.453804016113281, 13.86502456665039, 14.276247024536133, 14.687468528747559, 15.098690032958984, 15.50991153717041, 15.921133041381836, 16.332355499267578, 16.743576049804688, 17.15479850769043, 17.56601905822754, 17.97724151611328]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 7.0, 8.0, 20.0, 27.0, 33.0, 54.0, 45.0, 75.0, 76.0, 72.0, 88.0, 103.0, 85.0, 75.0, 63.0, 60.0, 28.0, 21.0, 26.0, 15.0, 7.0, 6.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.4254045486450195, -5.222396373748779, -5.019388675689697, -4.816380500793457, -4.613372802734375, -4.410364627838135, -4.2073564529418945, -4.0043487548828125, -3.8013405799865723, -3.598332643508911, -3.39532470703125, -3.1923165321350098, -2.9893085956573486, -2.7863006591796875, -2.5832924842834473, -2.380284547805786, -2.177276611328125, -1.9742686748504639, -1.7712606191635132, -1.5682525634765625, -1.3652446269989014, -1.1622366905212402, -0.9592286348342896, -0.7562205791473389, -0.5532126426696777, -0.3502046465873718, -0.14719665050506592, 0.05581134557723999, 0.2588193416595459, 0.46182727813720703, 0.6648353338241577, 0.8678433895111084, 1.0708513259887695, 1.2738592624664307, 1.4768673181533813, 1.679875373840332, 1.8828833103179932, 2.0858912467956543, 2.2888994216918945, 2.4919073581695557, 2.694915294647217, 2.897923231124878, 3.100931167602539, 3.3039393424987793, 3.5069472789764404, 3.7099552154541016, 3.912963390350342, 4.115971565246582, 4.318979263305664, 4.521987438201904, 4.724995136260986, 4.928003311157227, 5.131011009216309, 5.334019184112549, 5.537027359008789, 5.740035057067871, 5.943043231964111, 6.146051406860352, 6.349059104919434, 6.552067279815674, 6.755075454711914, 6.958083152770996, 7.161091327667236, 7.364099502563477, 7.567107200622559]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 2.0, 10.0, 4.0, 12.0, 8.0, 16.0, 20.0, 31.0, 59.0, 48.0, 92.0, 116.0, 214.0, 377.0, 719.0, 1521.0, 3954.0, 12123.0, 47029.0, 228799.0, 541319.0, 162445.0, 34359.0, 9398.0, 3083.0, 1262.0, 575.0, 363.0, 190.0, 116.0, 83.0, 49.0, 33.0, 34.0, 18.0, 23.0, 7.0, 13.0, 9.0, 5.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.814453125, -2.727569580078125, -2.64068603515625, -2.553802490234375, -2.4669189453125, -2.380035400390625, -2.29315185546875, -2.206268310546875, -2.119384765625, -2.032501220703125, -1.94561767578125, -1.858734130859375, -1.7718505859375, -1.684967041015625, -1.59808349609375, -1.511199951171875, -1.42431640625, -1.337432861328125, -1.25054931640625, -1.163665771484375, -1.0767822265625, -0.989898681640625, -0.90301513671875, -0.816131591796875, -0.729248046875, -0.642364501953125, -0.55548095703125, -0.468597412109375, -0.3817138671875, -0.294830322265625, -0.20794677734375, -0.121063232421875, -0.0341796875, 0.052703857421875, 0.13958740234375, 0.226470947265625, 0.3133544921875, 0.400238037109375, 0.48712158203125, 0.574005126953125, 0.660888671875, 0.747772216796875, 0.83465576171875, 0.921539306640625, 1.0084228515625, 1.095306396484375, 1.18218994140625, 1.269073486328125, 1.35595703125, 1.442840576171875, 1.52972412109375, 1.616607666015625, 1.7034912109375, 1.790374755859375, 1.87725830078125, 1.964141845703125, 2.051025390625, 2.137908935546875, 2.22479248046875, 2.311676025390625, 2.3985595703125, 2.485443115234375, 2.57232666015625, 2.659210205078125, 2.74609375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 7.0, 12.0, 25.0, 27.0, 70.0, 68.0, 102.0, 121.0, 135.0, 100.0, 91.0, 82.0, 56.0, 49.0, 18.0, 20.0, 13.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5498046875, -0.5255279541015625, -0.501251220703125, -0.4769744873046875, -0.45269775390625, -0.4284210205078125, -0.404144287109375, -0.3798675537109375, -0.3555908203125, -0.3313140869140625, -0.307037353515625, -0.2827606201171875, -0.25848388671875, -0.2342071533203125, -0.209930419921875, -0.1856536865234375, -0.161376953125, -0.1371002197265625, -0.112823486328125, -0.0885467529296875, -0.06427001953125, -0.0399932861328125, -0.015716552734375, 0.0085601806640625, 0.0328369140625, 0.0571136474609375, 0.081390380859375, 0.1056671142578125, 0.12994384765625, 0.1542205810546875, 0.178497314453125, 0.2027740478515625, 0.22705078125, 0.2513275146484375, 0.275604248046875, 0.2998809814453125, 0.32415771484375, 0.3484344482421875, 0.372711181640625, 0.3969879150390625, 0.4212646484375, 0.4455413818359375, 0.469818115234375, 0.4940948486328125, 0.51837158203125, 0.5426483154296875, 0.566925048828125, 0.5912017822265625, 0.615478515625, 0.6397552490234375, 0.664031982421875, 0.6883087158203125, 0.71258544921875, 0.7368621826171875, 0.761138916015625, 0.7854156494140625, 0.8096923828125, 0.8339691162109375, 0.858245849609375, 0.8825225830078125, 0.90679931640625, 0.9310760498046875, 0.955352783203125, 0.9796295166015625, 1.00390625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 7.0, 5.0, 11.0, 2.0, 10.0, 10.0, 18.0, 30.0, 40.0, 52.0, 83.0, 141.0, 253.0, 417.0, 769.0, 1549.0, 3176.0, 6949.0, 16410.0, 43462.0, 130057.0, 359882.0, 315118.0, 107266.0, 37062.0, 14052.0, 5982.0, 2747.0, 1320.0, 657.0, 420.0, 211.0, 133.0, 72.0, 46.0, 42.0, 23.0, 18.0, 21.0, 10.0, 4.0, 13.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7890625, -1.7363128662109375, -1.683563232421875, -1.6308135986328125, -1.57806396484375, -1.5253143310546875, -1.472564697265625, -1.4198150634765625, -1.3670654296875, -1.3143157958984375, -1.261566162109375, -1.2088165283203125, -1.15606689453125, -1.1033172607421875, -1.050567626953125, -0.9978179931640625, -0.945068359375, -0.8923187255859375, -0.839569091796875, -0.7868194580078125, -0.73406982421875, -0.6813201904296875, -0.628570556640625, -0.5758209228515625, -0.5230712890625, -0.4703216552734375, -0.417572021484375, -0.3648223876953125, -0.31207275390625, -0.2593231201171875, -0.206573486328125, -0.1538238525390625, -0.10107421875, -0.0483245849609375, 0.004425048828125, 0.0571746826171875, 0.10992431640625, 0.1626739501953125, 0.215423583984375, 0.2681732177734375, 0.3209228515625, 0.3736724853515625, 0.426422119140625, 0.4791717529296875, 0.53192138671875, 0.5846710205078125, 0.637420654296875, 0.6901702880859375, 0.742919921875, 0.7956695556640625, 0.848419189453125, 0.9011688232421875, 0.95391845703125, 1.0066680908203125, 1.059417724609375, 1.1121673583984375, 1.1649169921875, 1.2176666259765625, 1.270416259765625, 1.3231658935546875, 1.37591552734375, 1.4286651611328125, 1.481414794921875, 1.5341644287109375, 1.5869140625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 5.0, 9.0, 7.0, 14.0, 13.0, 17.0, 17.0, 28.0, 20.0, 16.0, 23.0, 23.0, 39.0, 37.0, 43.0, 48.0, 55.0, 47.0, 33.0, 35.0, 48.0, 36.0, 36.0, 56.0, 28.0, 30.0, 30.0, 26.0, 27.0, 23.0, 19.0, 19.0, 16.0, 10.0, 6.0, 10.0, 9.0, 5.0, 2.0, 10.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.439453125, -1.3928375244140625, -1.346221923828125, -1.2996063232421875, -1.25299072265625, -1.2063751220703125, -1.159759521484375, -1.1131439208984375, -1.0665283203125, -1.0199127197265625, -0.973297119140625, -0.9266815185546875, -0.88006591796875, -0.8334503173828125, -0.786834716796875, -0.7402191162109375, -0.693603515625, -0.6469879150390625, -0.600372314453125, -0.5537567138671875, -0.50714111328125, -0.4605255126953125, -0.413909912109375, -0.3672943115234375, -0.3206787109375, -0.2740631103515625, -0.227447509765625, -0.1808319091796875, -0.13421630859375, -0.0876007080078125, -0.040985107421875, 0.0056304931640625, 0.05224609375, 0.0988616943359375, 0.145477294921875, 0.1920928955078125, 0.23870849609375, 0.2853240966796875, 0.331939697265625, 0.3785552978515625, 0.4251708984375, 0.4717864990234375, 0.518402099609375, 0.5650177001953125, 0.61163330078125, 0.6582489013671875, 0.704864501953125, 0.7514801025390625, 0.798095703125, 0.8447113037109375, 0.891326904296875, 0.9379425048828125, 0.98455810546875, 1.0311737060546875, 1.077789306640625, 1.1244049072265625, 1.1710205078125, 1.2176361083984375, 1.264251708984375, 1.3108673095703125, 1.35748291015625, 1.4040985107421875, 1.450714111328125, 1.4973297119140625, 1.5439453125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 5.0, 3.0, 8.0, 8.0, 10.0, 26.0, 35.0, 52.0, 97.0, 152.0, 353.0, 759.0, 2042.0, 6332.0, 30178.0, 313664.0, 623343.0, 56729.0, 9959.0, 2867.0, 1011.0, 461.0, 213.0, 113.0, 49.0, 33.0, 18.0, 14.0, 9.0, 5.0, 1.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96142578125, -0.9112472534179688, -0.8610687255859375, -0.8108901977539062, -0.760711669921875, -0.7105331420898438, -0.6603546142578125, -0.6101760864257812, -0.55999755859375, -0.5098190307617188, -0.4596405029296875, -0.40946197509765625, -0.359283447265625, -0.30910491943359375, -0.2589263916015625, -0.20874786376953125, -0.1585693359375, -0.10839080810546875, -0.0582122802734375, -0.00803375244140625, 0.042144775390625, 0.09232330322265625, 0.1425018310546875, 0.19268035888671875, 0.24285888671875, 0.29303741455078125, 0.3432159423828125, 0.39339447021484375, 0.443572998046875, 0.49375152587890625, 0.5439300537109375, 0.5941085815429688, 0.644287109375, 0.6944656372070312, 0.7446441650390625, 0.7948226928710938, 0.845001220703125, 0.8951797485351562, 0.9453582763671875, 0.9955368041992188, 1.04571533203125, 1.0958938598632812, 1.1460723876953125, 1.1962509155273438, 1.246429443359375, 1.2966079711914062, 1.3467864990234375, 1.3969650268554688, 1.4471435546875, 1.4973220825195312, 1.5475006103515625, 1.5976791381835938, 1.647857666015625, 1.6980361938476562, 1.7482147216796875, 1.7983932495117188, 1.84857177734375, 1.8987503051757812, 1.9489288330078125, 1.9991073608398438, 2.049285888671875, 2.0994644165039062, 2.1496429443359375, 2.1998214721679688, 2.25]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 11.0, 7.0, 7.0, 6.0, 16.0, 15.0, 20.0, 21.0, 36.0, 40.0, 74.0, 74.0, 101.0, 118.0, 108.0, 88.0, 81.0, 46.0, 35.0, 20.0, 29.0, 10.0, 10.0, 13.0, 9.0, 4.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013256072998046875, -0.00012739747762680054, -0.00012223422527313232, -0.00011707097291946411, -0.0001119077205657959, -0.00010674446821212769, -0.00010158121585845947, -9.641796350479126e-05, -9.125471115112305e-05, -8.609145879745483e-05, -8.092820644378662e-05, -7.576495409011841e-05, -7.06017017364502e-05, -6.543844938278198e-05, -6.027519702911377e-05, -5.511194467544556e-05, -4.9948692321777344e-05, -4.478543996810913e-05, -3.962218761444092e-05, -3.4458935260772705e-05, -2.9295682907104492e-05, -2.413243055343628e-05, -1.8969178199768066e-05, -1.3805925846099854e-05, -8.64267349243164e-06, -3.4794211387634277e-06, 1.6838312149047852e-06, 6.847083568572998e-06, 1.2010335922241211e-05, 1.7173588275909424e-05, 2.2336840629577637e-05, 2.750009298324585e-05, 3.266334533691406e-05, 3.7826597690582275e-05, 4.298985004425049e-05, 4.81531023979187e-05, 5.3316354751586914e-05, 5.847960710525513e-05, 6.364285945892334e-05, 6.880611181259155e-05, 7.396936416625977e-05, 7.913261651992798e-05, 8.429586887359619e-05, 8.94591212272644e-05, 9.462237358093262e-05, 9.978562593460083e-05, 0.00010494887828826904, 0.00011011213064193726, 0.00011527538299560547, 0.00012043863534927368, 0.0001256018877029419, 0.0001307651400566101, 0.00013592839241027832, 0.00014109164476394653, 0.00014625489711761475, 0.00015141814947128296, 0.00015658140182495117, 0.00016174465417861938, 0.0001669079065322876, 0.0001720711588859558, 0.00017723441123962402, 0.00018239766359329224, 0.00018756091594696045, 0.00019272416830062866, 0.00019788742065429688]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 3.0, 3.0, 8.0, 11.0, 18.0, 35.0, 38.0, 56.0, 114.0, 186.0, 349.0, 760.0, 1764.0, 5242.0, 21964.0, 183860.0, 738653.0, 76808.0, 12702.0, 3446.0, 1284.0, 568.0, 290.0, 149.0, 93.0, 40.0, 45.0, 15.0, 13.0, 10.0, 9.0, 4.0, 3.0, 2.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3916015625, -1.3366546630859375, -1.281707763671875, -1.2267608642578125, -1.17181396484375, -1.1168670654296875, -1.061920166015625, -1.0069732666015625, -0.9520263671875, -0.8970794677734375, -0.842132568359375, -0.7871856689453125, -0.73223876953125, -0.6772918701171875, -0.622344970703125, -0.5673980712890625, -0.512451171875, -0.4575042724609375, -0.402557373046875, -0.3476104736328125, -0.29266357421875, -0.2377166748046875, -0.182769775390625, -0.1278228759765625, -0.0728759765625, -0.0179290771484375, 0.037017822265625, 0.0919647216796875, 0.14691162109375, 0.2018585205078125, 0.256805419921875, 0.3117523193359375, 0.36669921875, 0.4216461181640625, 0.476593017578125, 0.5315399169921875, 0.58648681640625, 0.6414337158203125, 0.696380615234375, 0.7513275146484375, 0.8062744140625, 0.8612213134765625, 0.916168212890625, 0.9711151123046875, 1.02606201171875, 1.0810089111328125, 1.135955810546875, 1.1909027099609375, 1.245849609375, 1.3007965087890625, 1.355743408203125, 1.4106903076171875, 1.46563720703125, 1.5205841064453125, 1.575531005859375, 1.6304779052734375, 1.6854248046875, 1.7403717041015625, 1.795318603515625, 1.8502655029296875, 1.90521240234375, 1.9601593017578125, 2.015106201171875, 2.0700531005859375, 2.125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 10.0, 2.0, 6.0, 10.0, 17.0, 14.0, 21.0, 37.0, 43.0, 65.0, 90.0, 141.0, 134.0, 118.0, 71.0, 70.0, 40.0, 26.0, 24.0, 17.0, 10.0, 9.0, 6.0, 8.0, 6.0, 2.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70166015625, -0.6689529418945312, -0.6362457275390625, -0.6035385131835938, -0.570831298828125, -0.5381240844726562, -0.5054168701171875, -0.47270965576171875, -0.44000244140625, -0.40729522705078125, -0.3745880126953125, -0.34188079833984375, -0.309173583984375, -0.27646636962890625, -0.2437591552734375, -0.21105194091796875, -0.1783447265625, -0.14563751220703125, -0.1129302978515625, -0.08022308349609375, -0.047515869140625, -0.01480865478515625, 0.0178985595703125, 0.05060577392578125, 0.08331298828125, 0.11602020263671875, 0.1487274169921875, 0.18143463134765625, 0.214141845703125, 0.24684906005859375, 0.2795562744140625, 0.31226348876953125, 0.344970703125, 0.37767791748046875, 0.4103851318359375, 0.44309234619140625, 0.475799560546875, 0.5085067749023438, 0.5412139892578125, 0.5739212036132812, 0.60662841796875, 0.6393356323242188, 0.6720428466796875, 0.7047500610351562, 0.737457275390625, 0.7701644897460938, 0.8028717041015625, 0.8355789184570312, 0.8682861328125, 0.9009933471679688, 0.9337005615234375, 0.9664077758789062, 0.999114990234375, 1.0318222045898438, 1.0645294189453125, 1.0972366333007812, 1.12994384765625, 1.1626510620117188, 1.1953582763671875, 1.2280654907226562, 1.260772705078125, 1.2934799194335938, 1.3261871337890625, 1.3588943481445312, 1.3916015625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 12.0, 11.0, 31.0, 63.0, 149.0, 247.0, 247.0, 147.0, 53.0, 24.0, 16.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.719709396362305, -10.991731643676758, -10.263754844665527, -9.53577709197998, -8.80780029296875, -8.079822540283203, -7.351844787597656, -6.623867511749268, -5.895890235900879, -5.16791296005249, -4.439935684204102, -3.7119579315185547, -2.983980655670166, -2.2560033798217773, -1.5280256271362305, -0.8000483512878418, -0.07207107543945312, 0.6559063196182251, 1.3838837146759033, 2.111861228942871, 2.8398385047912598, 3.5678157806396484, 4.295793533325195, 5.023770809173584, 5.751748085021973, 6.479725360870361, 7.20770263671875, 7.935680389404297, 8.663658142089844, 9.391634941101074, 10.119612693786621, 10.847589492797852, 11.575565338134766, 12.303543090820312, 13.031519889831543, 13.75949764251709, 14.48747444152832, 15.215452194213867, 15.943429946899414, 16.67140769958496, 17.399383544921875, 18.127361297607422, 18.85533905029297, 19.583316802978516, 20.31129264831543, 21.039270401000977, 21.767248153686523, 22.49522590637207, 23.223203659057617, 23.951181411743164, 24.67915916442871, 25.407135009765625, 26.135112762451172, 26.86309051513672, 27.591068267822266, 28.319046020507812, 29.04702377319336, 29.775001525878906, 30.502979278564453, 31.23095703125, 31.958932876586914, 32.686912536621094, 33.414886474609375, 34.14286422729492, 34.87084197998047]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 0.0, 4.0, 7.0, 4.0, 8.0, 12.0, 10.0, 9.0, 11.0, 20.0, 28.0, 26.0, 34.0, 28.0, 36.0, 36.0, 45.0, 55.0, 53.0, 48.0, 47.0, 54.0, 47.0, 44.0, 41.0, 55.0, 26.0, 38.0, 35.0, 36.0, 18.0, 24.0, 18.0, 7.0, 13.0, 5.0, 7.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.843990325927734, -8.51794719696045, -8.191904067993164, -7.865861415863037, -7.539818286895752, -7.213775157928467, -6.88773250579834, -6.561689376831055, -6.2356462478637695, -5.909603118896484, -5.583559989929199, -5.257517337799072, -4.931474208831787, -4.605431079864502, -4.279388427734375, -3.95334529876709, -3.6273021697998047, -3.3012590408325195, -2.9752161502838135, -2.6491732597351074, -2.3231301307678223, -1.9970871210098267, -1.671044111251831, -1.345001220703125, -1.0189580917358398, -0.6929150819778442, -0.36687207221984863, -0.04082906246185303, 0.2852139472961426, 0.6112569570541382, 0.9372999668121338, 1.2633428573608398, 1.5893869400024414, 1.915429949760437, 2.2414729595184326, 2.5675158500671387, 2.893558979034424, 3.219602108001709, 3.545644998550415, 3.871687889099121, 4.197731018066406, 4.523774147033691, 4.849817276000977, 5.1758599281311035, 5.501903057098389, 5.827946186065674, 6.153988838195801, 6.480031967163086, 6.806075096130371, 7.132118225097656, 7.458161354064941, 7.784204006195068, 8.110246658325195, 8.43628978729248, 8.762332916259766, 9.08837604522705, 9.414419174194336, 9.740462303161621, 10.066505432128906, 10.392548561096191, 10.718591690063477, 11.044633865356445, 11.37067699432373, 11.696720123291016, 12.0227632522583]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 5.0, 12.0, 14.0, 31.0, 59.0, 106.0, 219.0, 441.0, 987.0, 2549.0, 8564.0, 39744.0, 3774099.0, 335647.0, 22506.0, 5631.0, 1869.0, 752.0, 337.0, 197.0, 158.0, 92.0, 61.0, 49.0, 38.0, 31.0, 18.0, 17.0, 16.0, 9.0, 6.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8046875, -2.6558837890625, -2.507080078125, -2.3582763671875, -2.20947265625, -2.0606689453125, -1.911865234375, -1.7630615234375, -1.6142578125, -1.4654541015625, -1.316650390625, -1.1678466796875, -1.01904296875, -0.8702392578125, -0.721435546875, -0.5726318359375, -0.423828125, -0.2750244140625, -0.126220703125, 0.0225830078125, 0.17138671875, 0.3201904296875, 0.468994140625, 0.6177978515625, 0.7666015625, 0.9154052734375, 1.064208984375, 1.2130126953125, 1.36181640625, 1.5106201171875, 1.659423828125, 1.8082275390625, 1.95703125, 2.1058349609375, 2.254638671875, 2.4034423828125, 2.55224609375, 2.7010498046875, 2.849853515625, 2.9986572265625, 3.1474609375, 3.2962646484375, 3.445068359375, 3.5938720703125, 3.74267578125, 3.8914794921875, 4.040283203125, 4.1890869140625, 4.337890625, 4.4866943359375, 4.635498046875, 4.7843017578125, 4.93310546875, 5.0819091796875, 5.230712890625, 5.3795166015625, 5.5283203125, 5.6771240234375, 5.825927734375, 5.9747314453125, 6.12353515625, 6.2723388671875, 6.421142578125, 6.5699462890625, 6.71875]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 2.0, 10.0, 20.0, 31.0, 42.0, 74.0, 58.0, 90.0, 106.0, 112.0, 98.0, 80.0, 72.0, 71.0, 40.0, 39.0, 15.0, 13.0, 10.0, 7.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4287109375, -0.40570068359375, -0.3826904296875, -0.35968017578125, -0.336669921875, -0.31365966796875, -0.2906494140625, -0.26763916015625, -0.24462890625, -0.22161865234375, -0.1986083984375, -0.17559814453125, -0.152587890625, -0.12957763671875, -0.1065673828125, -0.08355712890625, -0.060546875, -0.03753662109375, -0.0145263671875, 0.00848388671875, 0.031494140625, 0.05450439453125, 0.0775146484375, 0.10052490234375, 0.12353515625, 0.14654541015625, 0.1695556640625, 0.19256591796875, 0.215576171875, 0.23858642578125, 0.2615966796875, 0.28460693359375, 0.3076171875, 0.33062744140625, 0.3536376953125, 0.37664794921875, 0.399658203125, 0.42266845703125, 0.4456787109375, 0.46868896484375, 0.49169921875, 0.51470947265625, 0.5377197265625, 0.56072998046875, 0.583740234375, 0.60675048828125, 0.6297607421875, 0.65277099609375, 0.67578125, 0.69879150390625, 0.7218017578125, 0.74481201171875, 0.767822265625, 0.79083251953125, 0.8138427734375, 0.83685302734375, 0.85986328125, 0.88287353515625, 0.9058837890625, 0.92889404296875, 0.951904296875, 0.97491455078125, 0.9979248046875, 1.02093505859375, 1.0439453125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 8.0, 17.0, 22.0, 35.0, 28.0, 48.0, 83.0, 209.0, 647.0, 2990.0, 27683.0, 4074519.0, 80706.0, 5470.0, 1120.0, 285.0, 137.0, 75.0, 63.0, 41.0, 33.0, 12.0, 16.0, 12.0, 8.0, 4.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.17578125, -4.92510986328125, -4.6744384765625, -4.42376708984375, -4.173095703125, -3.92242431640625, -3.6717529296875, -3.42108154296875, -3.17041015625, -2.91973876953125, -2.6690673828125, -2.41839599609375, -2.167724609375, -1.91705322265625, -1.6663818359375, -1.41571044921875, -1.1650390625, -0.91436767578125, -0.6636962890625, -0.41302490234375, -0.162353515625, 0.08831787109375, 0.3389892578125, 0.58966064453125, 0.84033203125, 1.09100341796875, 1.3416748046875, 1.59234619140625, 1.843017578125, 2.09368896484375, 2.3443603515625, 2.59503173828125, 2.845703125, 3.09637451171875, 3.3470458984375, 3.59771728515625, 3.848388671875, 4.09906005859375, 4.3497314453125, 4.60040283203125, 4.85107421875, 5.10174560546875, 5.3524169921875, 5.60308837890625, 5.853759765625, 6.10443115234375, 6.3551025390625, 6.60577392578125, 6.8564453125, 7.10711669921875, 7.3577880859375, 7.60845947265625, 7.859130859375, 8.10980224609375, 8.3604736328125, 8.61114501953125, 8.86181640625, 9.11248779296875, 9.3631591796875, 9.61383056640625, 9.864501953125, 10.11517333984375, 10.3658447265625, 10.61651611328125, 10.8671875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 11.0, 23.0, 42.0, 120.0, 748.0, 2808.0, 187.0, 61.0, 32.0, 17.0, 8.0, 5.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85107421875, -0.7949905395507812, -0.7389068603515625, -0.6828231811523438, -0.626739501953125, -0.5706558227539062, -0.5145721435546875, -0.45848846435546875, -0.40240478515625, -0.34632110595703125, -0.2902374267578125, -0.23415374755859375, -0.178070068359375, -0.12198638916015625, -0.0659027099609375, -0.00981903076171875, 0.0462646484375, 0.10234832763671875, 0.1584320068359375, 0.21451568603515625, 0.270599365234375, 0.32668304443359375, 0.3827667236328125, 0.43885040283203125, 0.49493408203125, 0.5510177612304688, 0.6071014404296875, 0.6631851196289062, 0.719268798828125, 0.7753524780273438, 0.8314361572265625, 0.8875198364257812, 0.943603515625, 0.9996871948242188, 1.0557708740234375, 1.1118545532226562, 1.167938232421875, 1.2240219116210938, 1.2801055908203125, 1.3361892700195312, 1.39227294921875, 1.4483566284179688, 1.5044403076171875, 1.5605239868164062, 1.616607666015625, 1.6726913452148438, 1.7287750244140625, 1.7848587036132812, 1.8409423828125, 1.8970260620117188, 1.9531097412109375, 2.0091934204101562, 2.065277099609375, 2.1213607788085938, 2.1774444580078125, 2.2335281372070312, 2.28961181640625, 2.3456954956054688, 2.4017791748046875, 2.4578628540039062, 2.513946533203125, 2.5700302124023438, 2.6261138916015625, 2.6821975708007812, 2.73828125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 9.0, 9.0, 25.0, 72.0, 183.0, 279.0, 234.0, 120.0, 29.0, 27.0, 8.0, 7.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5134382247924805, -4.243607044219971, -3.97377610206604, -3.7039451599121094, -3.4341139793395996, -3.16428279876709, -2.894451856613159, -2.6246209144592285, -2.3547897338867188, -2.084958553314209, -1.8151276111602783, -1.545296549797058, -1.275465488433838, -1.0056344270706177, -0.7358033657073975, -0.46597230434417725, -0.19614124298095703, 0.07368981838226318, 0.3435208797454834, 0.6133519411087036, 0.8831830024719238, 1.153014063835144, 1.4228451251983643, 1.6926761865615845, 1.9625072479248047, 2.2323384284973145, 2.502169370651245, 2.772000312805176, 3.0418314933776855, 3.3116626739501953, 3.581493616104126, 3.8513245582580566, 4.121156692504883, 4.390987873077393, 4.660819053649902, 4.930649757385254, 5.200480937957764, 5.470312118530273, 5.740142822265625, 6.009974002838135, 6.2798051834106445, 6.549636363983154, 6.819467544555664, 7.089298248291016, 7.359129428863525, 7.628960609436035, 7.898791313171387, 8.168622970581055, 8.438453674316406, 8.708284378051758, 8.978116035461426, 9.247946739196777, 9.517778396606445, 9.787609100341797, 10.057439804077148, 10.327271461486816, 10.597102165222168, 10.86693286895752, 11.136764526367188, 11.406595230102539, 11.67642593383789, 11.946257591247559, 12.21608829498291, 12.485919952392578, 12.75575065612793]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 13.0, 15.0, 26.0, 29.0, 39.0, 47.0, 33.0, 78.0, 75.0, 57.0, 80.0, 75.0, 67.0, 79.0, 52.0, 64.0, 47.0, 38.0, 22.0, 13.0, 13.0, 12.0, 6.0, 4.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.226044654846191, -4.091172695159912, -3.9563004970550537, -3.8214282989501953, -3.686556339263916, -3.5516843795776367, -3.4168121814727783, -3.28193998336792, -3.1470680236816406, -3.0121960639953613, -2.877323865890503, -2.7424516677856445, -2.6075797080993652, -2.472707748413086, -2.3378355503082275, -2.202963352203369, -2.06809139251709, -1.933219313621521, -1.7983472347259521, -1.6634751558303833, -1.5286030769348145, -1.3937309980392456, -1.2588589191436768, -1.123986840248108, -0.9891147613525391, -0.8542426824569702, -0.7193706035614014, -0.5844985246658325, -0.44962644577026367, -0.3147543668746948, -0.17988228797912598, -0.04501020908355713, 0.08986186981201172, 0.22473394870758057, 0.3596060276031494, 0.49447810649871826, 0.6293501853942871, 0.764222264289856, 0.8990943431854248, 1.0339664220809937, 1.1688385009765625, 1.3037105798721313, 1.4385826587677002, 1.573454737663269, 1.708326816558838, 1.8431988954544067, 1.9780709743499756, 2.112943172454834, 2.2478151321411133, 2.3826870918273926, 2.517559289932251, 2.6524314880371094, 2.7873034477233887, 2.922175407409668, 3.0570476055145264, 3.1919198036193848, 3.326791763305664, 3.4616637229919434, 3.5965359210968018, 3.73140811920166, 3.8662800788879395, 4.001152038574219, 4.136024475097656, 4.2708964347839355, 4.405768394470215]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 7.0, 7.0, 11.0, 15.0, 14.0, 19.0, 32.0, 50.0, 80.0, 132.0, 198.0, 329.0, 619.0, 1457.0, 3626.0, 12893.0, 69568.0, 473530.0, 409968.0, 58753.0, 11236.0, 3285.0, 1270.0, 612.0, 321.0, 170.0, 112.0, 80.0, 46.0, 34.0, 19.0, 22.0, 10.0, 10.0, 10.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.982421875, -3.861572265625, -3.74072265625, -3.619873046875, -3.4990234375, -3.378173828125, -3.25732421875, -3.136474609375, -3.015625, -2.894775390625, -2.77392578125, -2.653076171875, -2.5322265625, -2.411376953125, -2.29052734375, -2.169677734375, -2.048828125, -1.927978515625, -1.80712890625, -1.686279296875, -1.5654296875, -1.444580078125, -1.32373046875, -1.202880859375, -1.08203125, -0.961181640625, -0.84033203125, -0.719482421875, -0.5986328125, -0.477783203125, -0.35693359375, -0.236083984375, -0.115234375, 0.005615234375, 0.12646484375, 0.247314453125, 0.3681640625, 0.489013671875, 0.60986328125, 0.730712890625, 0.8515625, 0.972412109375, 1.09326171875, 1.214111328125, 1.3349609375, 1.455810546875, 1.57666015625, 1.697509765625, 1.818359375, 1.939208984375, 2.06005859375, 2.180908203125, 2.3017578125, 2.422607421875, 2.54345703125, 2.664306640625, 2.78515625, 2.906005859375, 3.02685546875, 3.147705078125, 3.2685546875, 3.389404296875, 3.51025390625, 3.631103515625, 3.751953125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 1.0, 1.0, 6.0, 1.0, 2.0, 1.0, 4.0, 5.0, 16.0, 16.0, 30.0, 49.0, 53.0, 85.0, 68.0, 96.0, 85.0, 96.0, 80.0, 91.0, 69.0, 48.0, 41.0, 20.0, 17.0, 12.0, 6.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.475341796875, -0.4513893127441406, -0.42743682861328125, -0.4034843444824219, -0.3795318603515625, -0.3555793762207031, -0.33162689208984375, -0.3076744079589844, -0.283721923828125, -0.2597694396972656, -0.23581695556640625, -0.21186447143554688, -0.1879119873046875, -0.16395950317382812, -0.14000701904296875, -0.11605453491210938, -0.09210205078125, -0.06814956665039062, -0.04419708251953125, -0.020244598388671875, 0.0037078857421875, 0.027660369873046875, 0.05161285400390625, 0.07556533813476562, 0.099517822265625, 0.12347030639648438, 0.14742279052734375, 0.17137527465820312, 0.1953277587890625, 0.21928024291992188, 0.24323272705078125, 0.2671852111816406, 0.2911376953125, 0.3150901794433594, 0.33904266357421875, 0.3629951477050781, 0.3869476318359375, 0.4109001159667969, 0.43485260009765625, 0.4588050842285156, 0.482757568359375, 0.5067100524902344, 0.5306625366210938, 0.5546150207519531, 0.5785675048828125, 0.6025199890136719, 0.6264724731445312, 0.6504249572753906, 0.67437744140625, 0.6983299255371094, 0.7222824096679688, 0.7462348937988281, 0.7701873779296875, 0.7941398620605469, 0.8180923461914062, 0.8420448303222656, 0.865997314453125, 0.8899497985839844, 0.9139022827148438, 0.9378547668457031, 0.9618072509765625, 0.9857597351074219, 1.0097122192382812, 1.0336647033691406, 1.0576171875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 1.0, 4.0, 4.0, 6.0, 8.0, 16.0, 15.0, 22.0, 44.0, 63.0, 110.0, 182.0, 345.0, 665.0, 1384.0, 3409.0, 10043.0, 37061.0, 197689.0, 599673.0, 153248.0, 30583.0, 8469.0, 2933.0, 1233.0, 579.0, 304.0, 164.0, 94.0, 73.0, 36.0, 22.0, 16.0, 16.0, 17.0, 7.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.68359375, -2.589202880859375, -2.49481201171875, -2.400421142578125, -2.3060302734375, -2.211639404296875, -2.11724853515625, -2.022857666015625, -1.928466796875, -1.834075927734375, -1.73968505859375, -1.645294189453125, -1.5509033203125, -1.456512451171875, -1.36212158203125, -1.267730712890625, -1.17333984375, -1.078948974609375, -0.98455810546875, -0.890167236328125, -0.7957763671875, -0.701385498046875, -0.60699462890625, -0.512603759765625, -0.418212890625, -0.323822021484375, -0.22943115234375, -0.135040283203125, -0.0406494140625, 0.053741455078125, 0.14813232421875, 0.242523193359375, 0.3369140625, 0.431304931640625, 0.52569580078125, 0.620086669921875, 0.7144775390625, 0.808868408203125, 0.90325927734375, 0.997650146484375, 1.092041015625, 1.186431884765625, 1.28082275390625, 1.375213623046875, 1.4696044921875, 1.563995361328125, 1.65838623046875, 1.752777099609375, 1.84716796875, 1.941558837890625, 2.03594970703125, 2.130340576171875, 2.2247314453125, 2.319122314453125, 2.41351318359375, 2.507904052734375, 2.602294921875, 2.696685791015625, 2.79107666015625, 2.885467529296875, 2.9798583984375, 3.074249267578125, 3.16864013671875, 3.263031005859375, 3.357421875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 6.0, 5.0, 9.0, 19.0, 13.0, 26.0, 40.0, 26.0, 45.0, 50.0, 53.0, 71.0, 83.0, 85.0, 77.0, 61.0, 64.0, 50.0, 43.0, 36.0, 31.0, 26.0, 18.0, 11.0, 12.0, 4.0, 10.0, 3.0, 3.0, 2.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.62890625, -2.533538818359375, -2.43817138671875, -2.342803955078125, -2.2474365234375, -2.152069091796875, -2.05670166015625, -1.961334228515625, -1.865966796875, -1.770599365234375, -1.67523193359375, -1.579864501953125, -1.4844970703125, -1.389129638671875, -1.29376220703125, -1.198394775390625, -1.10302734375, -1.007659912109375, -0.91229248046875, -0.816925048828125, -0.7215576171875, -0.626190185546875, -0.53082275390625, -0.435455322265625, -0.340087890625, -0.244720458984375, -0.14935302734375, -0.053985595703125, 0.0413818359375, 0.136749267578125, 0.23211669921875, 0.327484130859375, 0.4228515625, 0.518218994140625, 0.61358642578125, 0.708953857421875, 0.8043212890625, 0.899688720703125, 0.99505615234375, 1.090423583984375, 1.185791015625, 1.281158447265625, 1.37652587890625, 1.471893310546875, 1.5672607421875, 1.662628173828125, 1.75799560546875, 1.853363037109375, 1.94873046875, 2.044097900390625, 2.13946533203125, 2.234832763671875, 2.3302001953125, 2.425567626953125, 2.52093505859375, 2.616302490234375, 2.711669921875, 2.807037353515625, 2.90240478515625, 2.997772216796875, 3.0931396484375, 3.188507080078125, 3.28387451171875, 3.379241943359375, 3.474609375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 11.0, 14.0, 36.0, 43.0, 50.0, 92.0, 154.0, 298.0, 582.0, 1527.0, 5262.0, 35286.0, 716119.0, 267592.0, 16183.0, 3221.0, 1026.0, 445.0, 213.0, 139.0, 71.0, 52.0, 31.0, 25.0, 16.0, 16.0, 9.0, 8.0, 5.0, 4.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.3125, -2.24609375, -2.1796875, -2.11328125, -2.046875, -1.98046875, -1.9140625, -1.84765625, -1.78125, -1.71484375, -1.6484375, -1.58203125, -1.515625, -1.44921875, -1.3828125, -1.31640625, -1.25, -1.18359375, -1.1171875, -1.05078125, -0.984375, -0.91796875, -0.8515625, -0.78515625, -0.71875, -0.65234375, -0.5859375, -0.51953125, -0.453125, -0.38671875, -0.3203125, -0.25390625, -0.1875, -0.12109375, -0.0546875, 0.01171875, 0.078125, 0.14453125, 0.2109375, 0.27734375, 0.34375, 0.41015625, 0.4765625, 0.54296875, 0.609375, 0.67578125, 0.7421875, 0.80859375, 0.875, 0.94140625, 1.0078125, 1.07421875, 1.140625, 1.20703125, 1.2734375, 1.33984375, 1.40625, 1.47265625, 1.5390625, 1.60546875, 1.671875, 1.73828125, 1.8046875, 1.87109375, 1.9375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 6.0, 10.0, 5.0, 13.0, 15.0, 34.0, 54.0, 87.0, 120.0, 171.0, 161.0, 117.0, 77.0, 55.0, 26.0, 21.0, 16.0, 8.0, 7.0, 1.0, 2.0, 3.0, 0.0, 2.0], "bins": [-0.000415802001953125, -0.0004074620082974434, -0.0003991220146417618, -0.00039078202098608017, -0.00038244202733039856, -0.00037410203367471695, -0.00036576204001903534, -0.00035742204636335373, -0.0003490820527076721, -0.0003407420590519905, -0.0003324020653963089, -0.0003240620717406273, -0.0003157220780849457, -0.00030738208442926407, -0.00029904209077358246, -0.00029070209711790085, -0.00028236210346221924, -0.00027402210980653763, -0.000265682116150856, -0.0002573421224951744, -0.0002490021288394928, -0.0002406621351838112, -0.00023232214152812958, -0.00022398214787244797, -0.00021564215421676636, -0.00020730216056108475, -0.00019896216690540314, -0.00019062217324972153, -0.00018228217959403992, -0.0001739421859383583, -0.0001656021922826767, -0.0001572621986269951, -0.00014892220497131348, -0.00014058221131563187, -0.00013224221765995026, -0.00012390222400426865, -0.00011556223034858704, -0.00010722223669290543, -9.888224303722382e-05, -9.05422493815422e-05, -8.22022557258606e-05, -7.386226207017899e-05, -6.552226841449738e-05, -5.7182274758815765e-05, -4.8842281103134155e-05, -4.0502287447452545e-05, -3.2162293791770935e-05, -2.3822300136089325e-05, -1.5482306480407715e-05, -7.142312824726105e-06, 1.1976808309555054e-06, 9.537674486637115e-06, 1.7877668142318726e-05, 2.6217661798000336e-05, 3.4557655453681946e-05, 4.2897649109363556e-05, 5.1237642765045166e-05, 5.9577636420726776e-05, 6.791763007640839e-05, 7.625762373209e-05, 8.45976173877716e-05, 9.293761104345322e-05, 0.00010127760469913483, 0.00010961759835481644, 0.00011795759201049805]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 8.0, 8.0, 9.0, 19.0, 26.0, 48.0, 57.0, 128.0, 221.0, 582.0, 1492.0, 6557.0, 62331.0, 855151.0, 109551.0, 9143.0, 2015.0, 620.0, 255.0, 135.0, 74.0, 35.0, 26.0, 17.0, 15.0, 6.0, 12.0, 7.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.458984375, -1.38812255859375, -1.3172607421875, -1.24639892578125, -1.175537109375, -1.10467529296875, -1.0338134765625, -0.96295166015625, -0.89208984375, -0.82122802734375, -0.7503662109375, -0.67950439453125, -0.608642578125, -0.53778076171875, -0.4669189453125, -0.39605712890625, -0.3251953125, -0.25433349609375, -0.1834716796875, -0.11260986328125, -0.041748046875, 0.02911376953125, 0.0999755859375, 0.17083740234375, 0.24169921875, 0.31256103515625, 0.3834228515625, 0.45428466796875, 0.525146484375, 0.59600830078125, 0.6668701171875, 0.73773193359375, 0.80859375, 0.87945556640625, 0.9503173828125, 1.02117919921875, 1.092041015625, 1.16290283203125, 1.2337646484375, 1.30462646484375, 1.37548828125, 1.44635009765625, 1.5172119140625, 1.58807373046875, 1.658935546875, 1.72979736328125, 1.8006591796875, 1.87152099609375, 1.9423828125, 2.01324462890625, 2.0841064453125, 2.15496826171875, 2.225830078125, 2.29669189453125, 2.3675537109375, 2.43841552734375, 2.50927734375, 2.58013916015625, 2.6510009765625, 2.72186279296875, 2.792724609375, 2.86358642578125, 2.9344482421875, 3.00531005859375, 3.076171875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 5.0, 11.0, 13.0, 15.0, 32.0, 38.0, 85.0, 136.0, 148.0, 170.0, 139.0, 85.0, 41.0, 39.0, 12.0, 12.0, 3.0, 4.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2412109375, -1.1968841552734375, -1.152557373046875, -1.1082305908203125, -1.06390380859375, -1.0195770263671875, -0.975250244140625, -0.9309234619140625, -0.8865966796875, -0.8422698974609375, -0.797943115234375, -0.7536163330078125, -0.70928955078125, -0.6649627685546875, -0.620635986328125, -0.5763092041015625, -0.531982421875, -0.4876556396484375, -0.443328857421875, -0.3990020751953125, -0.35467529296875, -0.3103485107421875, -0.266021728515625, -0.2216949462890625, -0.1773681640625, -0.1330413818359375, -0.088714599609375, -0.0443878173828125, -6.103515625e-05, 0.0442657470703125, 0.088592529296875, 0.1329193115234375, 0.17724609375, 0.2215728759765625, 0.265899658203125, 0.3102264404296875, 0.35455322265625, 0.3988800048828125, 0.443206787109375, 0.4875335693359375, 0.5318603515625, 0.5761871337890625, 0.620513916015625, 0.6648406982421875, 0.70916748046875, 0.7534942626953125, 0.797821044921875, 0.8421478271484375, 0.886474609375, 0.9308013916015625, 0.975128173828125, 1.0194549560546875, 1.06378173828125, 1.1081085205078125, 1.152435302734375, 1.1967620849609375, 1.2410888671875, 1.2854156494140625, 1.329742431640625, 1.3740692138671875, 1.41839599609375, 1.4627227783203125, 1.507049560546875, 1.5513763427734375, 1.595703125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 6.0, 14.0, 15.0, 27.0, 58.0, 114.0, 201.0, 272.0, 177.0, 69.0, 32.0, 13.0, 6.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.090682983398438, -18.230228424072266, -17.369773864746094, -16.509319305419922, -15.648863792419434, -14.788409233093262, -13.92795467376709, -13.067499160766602, -12.20704460144043, -11.346590042114258, -10.486135482788086, -9.625680923461914, -8.765225410461426, -7.904770851135254, -7.044316291809082, -6.183861255645752, -5.323407173156738, -4.462952613830566, -3.6024975776672363, -2.7420430183410645, -1.8815882205963135, -1.0211334228515625, -0.16067886352539062, 0.6997761726379395, 1.5602307319641113, 2.4206855297088623, 3.2811403274536133, 4.141594886779785, 5.002049446105957, 5.862504482269287, 6.722959041595459, 7.583414077758789, 8.443868637084961, 9.304323196411133, 10.164777755737305, 11.025232315063477, 11.885687828063965, 12.746142387390137, 13.606596946716309, 14.467052459716797, 15.327507019042969, 16.18796157836914, 17.048416137695312, 17.908870697021484, 18.769325256347656, 19.629779815673828, 20.490234375, 21.350690841674805, 22.211143493652344, 23.071598052978516, 23.932052612304688, 24.79250717163086, 25.65296173095703, 26.513416290283203, 27.373870849609375, 28.23432731628418, 29.09478187561035, 29.955236434936523, 30.815690994262695, 31.676145553588867, 32.53660202026367, 33.397056579589844, 34.257511138916016, 35.11796569824219, 35.97842025756836]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 10.0, 8.0, 4.0, 7.0, 12.0, 15.0, 12.0, 16.0, 16.0, 22.0, 22.0, 31.0, 28.0, 37.0, 34.0, 35.0, 46.0, 44.0, 50.0, 46.0, 44.0, 39.0, 45.0, 52.0, 52.0, 29.0, 43.0, 30.0, 26.0, 24.0, 18.0, 20.0, 16.0, 14.0, 13.0, 6.0, 6.0, 2.0, 6.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0], "bins": [-13.339420318603516, -12.921771049499512, -12.504121780395508, -12.08647346496582, -11.668824195861816, -11.251174926757812, -10.833526611328125, -10.415877342224121, -9.998228073120117, -9.580578804016113, -9.16292953491211, -8.745281219482422, -8.327631950378418, -7.909982681274414, -7.492333889007568, -7.074685096740723, -6.657035827636719, -6.239386558532715, -5.821737766265869, -5.404088973999023, -4.9864397048950195, -4.568790435791016, -4.15114164352417, -3.733492612838745, -3.3158435821533203, -2.8981945514678955, -2.4805455207824707, -2.062896490097046, -1.645247459411621, -1.2275984287261963, -0.8099493980407715, -0.3923003673553467, 0.02534770965576172, 0.4429967403411865, 0.8606457710266113, 1.2782948017120361, 1.695943832397461, 2.1135928630828857, 2.5312418937683105, 2.9488909244537354, 3.36653995513916, 3.784188985824585, 4.20183801651001, 4.6194868087768555, 5.037136077880859, 5.454785346984863, 5.872434139251709, 6.290082931518555, 6.707732200622559, 7.1253814697265625, 7.543030261993408, 7.960679054260254, 8.378328323364258, 8.795977592468262, 9.213626861572266, 9.631275177001953, 10.048924446105957, 10.466573715209961, 10.884222030639648, 11.301871299743652, 11.719520568847656, 12.13716983795166, 12.554819107055664, 12.972467422485352, 13.390116691589355]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 13.0, 17.0, 25.0, 37.0, 58.0, 111.0, 177.0, 305.0, 563.0, 1014.0, 2342.0, 5121.0, 12523.0, 38306.0, 199956.0, 3737382.0, 143553.0, 32099.0, 11122.0, 4598.0, 2169.0, 1043.0, 562.0, 311.0, 209.0, 137.0, 110.0, 78.0, 66.0, 45.0, 35.0, 31.0, 17.0, 15.0, 26.0, 14.0, 14.0, 14.0, 12.0, 12.0, 9.0, 8.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.68359375, -2.55841064453125, -2.4332275390625, -2.30804443359375, -2.182861328125, -2.05767822265625, -1.9324951171875, -1.80731201171875, -1.68212890625, -1.55694580078125, -1.4317626953125, -1.30657958984375, -1.181396484375, -1.05621337890625, -0.9310302734375, -0.80584716796875, -0.6806640625, -0.55548095703125, -0.4302978515625, -0.30511474609375, -0.179931640625, -0.05474853515625, 0.0704345703125, 0.19561767578125, 0.32080078125, 0.44598388671875, 0.5711669921875, 0.69635009765625, 0.821533203125, 0.94671630859375, 1.0718994140625, 1.19708251953125, 1.322265625, 1.44744873046875, 1.5726318359375, 1.69781494140625, 1.822998046875, 1.94818115234375, 2.0733642578125, 2.19854736328125, 2.32373046875, 2.44891357421875, 2.5740966796875, 2.69927978515625, 2.824462890625, 2.94964599609375, 3.0748291015625, 3.20001220703125, 3.3251953125, 3.45037841796875, 3.5755615234375, 3.70074462890625, 3.825927734375, 3.95111083984375, 4.0762939453125, 4.20147705078125, 4.32666015625, 4.45184326171875, 4.5770263671875, 4.70220947265625, 4.827392578125, 4.95257568359375, 5.0777587890625, 5.20294189453125, 5.328125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 4.0, 3.0, 1.0, 8.0, 9.0, 21.0, 26.0, 17.0, 49.0, 55.0, 59.0, 78.0, 96.0, 79.0, 110.0, 82.0, 76.0, 54.0, 57.0, 31.0, 26.0, 21.0, 24.0, 7.0, 7.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.498291015625, -0.4732322692871094, -0.44817352294921875, -0.4231147766113281, -0.3980560302734375, -0.3729972839355469, -0.34793853759765625, -0.3228797912597656, -0.297821044921875, -0.2727622985839844, -0.24770355224609375, -0.22264480590820312, -0.1975860595703125, -0.17252731323242188, -0.14746856689453125, -0.12240982055664062, -0.09735107421875, -0.07229232788085938, -0.04723358154296875, -0.022174835205078125, 0.0028839111328125, 0.027942657470703125, 0.05300140380859375, 0.07806015014648438, 0.103118896484375, 0.12817764282226562, 0.15323638916015625, 0.17829513549804688, 0.2033538818359375, 0.22841262817382812, 0.25347137451171875, 0.2785301208496094, 0.3035888671875, 0.3286476135253906, 0.35370635986328125, 0.3787651062011719, 0.4038238525390625, 0.4288825988769531, 0.45394134521484375, 0.4790000915527344, 0.504058837890625, 0.5291175842285156, 0.5541763305664062, 0.5792350769042969, 0.6042938232421875, 0.6293525695800781, 0.6544113159179688, 0.6794700622558594, 0.70452880859375, 0.7295875549316406, 0.7546463012695312, 0.7797050476074219, 0.8047637939453125, 0.8298225402832031, 0.8548812866210938, 0.8799400329589844, 0.904998779296875, 0.9300575256347656, 0.9551162719726562, 0.9801750183105469, 1.0052337646484375, 1.0302925109863281, 1.0553512573242188, 1.0804100036621094, 1.10546875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 7.0, 2.0, 21.0, 38.0, 61.0, 83.0, 222.0, 760.0, 4839.0, 93761.0, 4065904.0, 24892.0, 2690.0, 555.0, 199.0, 99.0, 52.0, 32.0, 31.0, 17.0, 12.0, 4.0, 8.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7734375, -9.402099609375, -9.03076171875, -8.659423828125, -8.2880859375, -7.916748046875, -7.54541015625, -7.174072265625, -6.802734375, -6.431396484375, -6.06005859375, -5.688720703125, -5.3173828125, -4.946044921875, -4.57470703125, -4.203369140625, -3.83203125, -3.460693359375, -3.08935546875, -2.718017578125, -2.3466796875, -1.975341796875, -1.60400390625, -1.232666015625, -0.861328125, -0.489990234375, -0.11865234375, 0.252685546875, 0.6240234375, 0.995361328125, 1.36669921875, 1.738037109375, 2.109375, 2.480712890625, 2.85205078125, 3.223388671875, 3.5947265625, 3.966064453125, 4.33740234375, 4.708740234375, 5.080078125, 5.451416015625, 5.82275390625, 6.194091796875, 6.5654296875, 6.936767578125, 7.30810546875, 7.679443359375, 8.05078125, 8.422119140625, 8.79345703125, 9.164794921875, 9.5361328125, 9.907470703125, 10.27880859375, 10.650146484375, 11.021484375, 11.392822265625, 11.76416015625, 12.135498046875, 12.5068359375, 12.878173828125, 13.24951171875, 13.620849609375, 13.9921875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 7.0, 2.0, 12.0, 16.0, 17.0, 57.0, 105.0, 319.0, 2792.0, 497.0, 129.0, 46.0, 29.0, 17.0, 16.0, 5.0, 4.0, 9.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.009765625, -1.912322998046875, -1.81488037109375, -1.717437744140625, -1.6199951171875, -1.522552490234375, -1.42510986328125, -1.327667236328125, -1.230224609375, -1.132781982421875, -1.03533935546875, -0.937896728515625, -0.8404541015625, -0.743011474609375, -0.64556884765625, -0.548126220703125, -0.45068359375, -0.353240966796875, -0.25579833984375, -0.158355712890625, -0.0609130859375, 0.036529541015625, 0.13397216796875, 0.231414794921875, 0.328857421875, 0.426300048828125, 0.52374267578125, 0.621185302734375, 0.7186279296875, 0.816070556640625, 0.91351318359375, 1.010955810546875, 1.1083984375, 1.205841064453125, 1.30328369140625, 1.400726318359375, 1.4981689453125, 1.595611572265625, 1.69305419921875, 1.790496826171875, 1.887939453125, 1.985382080078125, 2.08282470703125, 2.180267333984375, 2.2777099609375, 2.375152587890625, 2.47259521484375, 2.570037841796875, 2.66748046875, 2.764923095703125, 2.86236572265625, 2.959808349609375, 3.0572509765625, 3.154693603515625, 3.25213623046875, 3.349578857421875, 3.447021484375, 3.544464111328125, 3.64190673828125, 3.739349365234375, 3.8367919921875, 3.934234619140625, 4.03167724609375, 4.129119873046875, 4.2265625]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 11.0, 23.0, 108.0, 429.0, 339.0, 75.0, 19.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.881589889526367, -7.990313529968262, -7.099037170410156, -6.207761287689209, -5.3164849281311035, -4.425208568572998, -3.533932685852051, -2.6426563262939453, -1.7513799667358398, -0.8601037263870239, 0.031172513961791992, 0.9224486351013184, 1.8137249946594238, 2.7050013542175293, 3.5962772369384766, 4.487553596496582, 5.3788299560546875, 6.270106315612793, 7.161382675170898, 8.052658081054688, 8.94393539428711, 9.835210800170898, 10.726487159729004, 11.61776351928711, 12.509039878845215, 13.40031623840332, 14.291592597961426, 15.182868957519531, 16.07414436340332, 16.965421676635742, 17.85669708251953, 18.747974395751953, 19.63924789428711, 20.5305233001709, 21.42180061340332, 22.31307601928711, 23.20435333251953, 24.09562873840332, 24.98690414428711, 25.87818145751953, 26.769458770751953, 27.660734176635742, 28.552011489868164, 29.443286895751953, 30.334564208984375, 31.225839614868164, 32.11711502075195, 33.008392333984375, 33.89966583251953, 34.79094314575195, 35.68221664428711, 36.57349395751953, 37.46477127075195, 38.356048583984375, 39.24732208251953, 40.13859939575195, 41.029876708984375, 41.9211540222168, 42.81242752075195, 43.703704833984375, 44.5949821472168, 45.48625946044922, 46.377532958984375, 47.2688102722168, 48.16008758544922]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 8.0, 7.0, 12.0, 25.0, 37.0, 53.0, 82.0, 91.0, 92.0, 139.0, 115.0, 97.0, 92.0, 58.0, 41.0, 27.0, 12.0, 15.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.755003929138184, -13.353261947631836, -12.951520919799805, -12.549778938293457, -12.14803695678711, -11.746295928955078, -11.34455394744873, -10.942811965942383, -10.541070938110352, -10.139328956604004, -9.737587928771973, -9.335845947265625, -8.934104919433594, -8.532362937927246, -8.130620956420898, -7.728879451751709, -7.3271379470825195, -6.92539644241333, -6.523654937744141, -6.121912956237793, -5.7201714515686035, -5.318429946899414, -4.916687965393066, -4.514946460723877, -4.1132049560546875, -3.711463451385498, -3.3097217082977295, -2.907979965209961, -2.5062384605407715, -2.104496955871582, -1.7027552127838135, -1.301013469696045, -0.8992710113525391, -0.49752938747406006, -0.09578776359558105, 0.30595386028289795, 0.707695484161377, 1.1094369888305664, 1.511178731918335, 1.9129204750061035, 2.314661979675293, 2.7164034843444824, 3.118145227432251, 3.5198869705200195, 3.921628475189209, 4.323369979858398, 4.725111961364746, 5.1268534660339355, 5.528594970703125, 5.9303364753723145, 6.332077980041504, 6.733819961547852, 7.135561466217041, 7.5373029708862305, 7.939044952392578, 8.34078598022461, 8.742527961730957, 9.144269943237305, 9.546010971069336, 9.947752952575684, 10.349494934082031, 10.751235961914062, 11.15297794342041, 11.554719924926758, 11.956460952758789]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 10.0, 6.0, 13.0, 16.0, 28.0, 30.0, 47.0, 56.0, 119.0, 172.0, 276.0, 554.0, 1266.0, 3456.0, 13024.0, 76959.0, 629175.0, 279285.0, 32954.0, 7052.0, 2149.0, 843.0, 410.0, 226.0, 128.0, 91.0, 53.0, 43.0, 27.0, 13.0, 17.0, 11.0, 12.0, 5.0, 9.0, 3.0, 1.0, 3.0, 8.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.689453125, -3.546356201171875, -3.40325927734375, -3.260162353515625, -3.1170654296875, -2.973968505859375, -2.83087158203125, -2.687774658203125, -2.544677734375, -2.401580810546875, -2.25848388671875, -2.115386962890625, -1.9722900390625, -1.829193115234375, -1.68609619140625, -1.542999267578125, -1.39990234375, -1.256805419921875, -1.11370849609375, -0.970611572265625, -0.8275146484375, -0.684417724609375, -0.54132080078125, -0.398223876953125, -0.255126953125, -0.112030029296875, 0.03106689453125, 0.174163818359375, 0.3172607421875, 0.460357666015625, 0.60345458984375, 0.746551513671875, 0.8896484375, 1.032745361328125, 1.17584228515625, 1.318939208984375, 1.4620361328125, 1.605133056640625, 1.74822998046875, 1.891326904296875, 2.034423828125, 2.177520751953125, 2.32061767578125, 2.463714599609375, 2.6068115234375, 2.749908447265625, 2.89300537109375, 3.036102294921875, 3.17919921875, 3.322296142578125, 3.46539306640625, 3.608489990234375, 3.7515869140625, 3.894683837890625, 4.03778076171875, 4.180877685546875, 4.323974609375, 4.467071533203125, 4.61016845703125, 4.753265380859375, 4.8963623046875, 5.039459228515625, 5.18255615234375, 5.325653076171875, 5.46875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 9.0, 14.0, 27.0, 40.0, 55.0, 93.0, 104.0, 138.0, 120.0, 107.0, 103.0, 90.0, 39.0, 28.0, 19.0, 7.0, 3.0, 5.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80517578125, -0.7689285278320312, -0.7326812744140625, -0.6964340209960938, -0.660186767578125, -0.6239395141601562, -0.5876922607421875, -0.5514450073242188, -0.51519775390625, -0.47895050048828125, -0.4427032470703125, -0.40645599365234375, -0.370208740234375, -0.33396148681640625, -0.2977142333984375, -0.26146697998046875, -0.2252197265625, -0.18897247314453125, -0.1527252197265625, -0.11647796630859375, -0.080230712890625, -0.04398345947265625, -0.0077362060546875, 0.02851104736328125, 0.06475830078125, 0.10100555419921875, 0.1372528076171875, 0.17350006103515625, 0.209747314453125, 0.24599456787109375, 0.2822418212890625, 0.31848907470703125, 0.354736328125, 0.39098358154296875, 0.4272308349609375, 0.46347808837890625, 0.499725341796875, 0.5359725952148438, 0.5722198486328125, 0.6084671020507812, 0.64471435546875, 0.6809616088867188, 0.7172088623046875, 0.7534561157226562, 0.789703369140625, 0.8259506225585938, 0.8621978759765625, 0.8984451293945312, 0.9346923828125, 0.9709396362304688, 1.0071868896484375, 1.0434341430664062, 1.079681396484375, 1.1159286499023438, 1.1521759033203125, 1.1884231567382812, 1.22467041015625, 1.2609176635742188, 1.2971649169921875, 1.3334121704101562, 1.369659423828125, 1.4059066772460938, 1.4421539306640625, 1.4784011840820312, 1.5146484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 5.0, 7.0, 16.0, 17.0, 34.0, 53.0, 82.0, 193.0, 459.0, 1260.0, 3900.0, 13710.0, 55863.0, 261678.0, 524692.0, 142187.0, 31884.0, 8293.0, 2622.0, 902.0, 356.0, 143.0, 70.0, 24.0, 27.0, 22.0, 16.0, 7.0, 4.0, 5.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.685546875, -2.607269287109375, -2.52899169921875, -2.450714111328125, -2.3724365234375, -2.294158935546875, -2.21588134765625, -2.137603759765625, -2.059326171875, -1.981048583984375, -1.90277099609375, -1.824493408203125, -1.7462158203125, -1.667938232421875, -1.58966064453125, -1.511383056640625, -1.43310546875, -1.354827880859375, -1.27655029296875, -1.198272705078125, -1.1199951171875, -1.041717529296875, -0.96343994140625, -0.885162353515625, -0.806884765625, -0.728607177734375, -0.65032958984375, -0.572052001953125, -0.4937744140625, -0.415496826171875, -0.33721923828125, -0.258941650390625, -0.1806640625, -0.102386474609375, -0.02410888671875, 0.054168701171875, 0.1324462890625, 0.210723876953125, 0.28900146484375, 0.367279052734375, 0.445556640625, 0.523834228515625, 0.60211181640625, 0.680389404296875, 0.7586669921875, 0.836944580078125, 0.91522216796875, 0.993499755859375, 1.07177734375, 1.150054931640625, 1.22833251953125, 1.306610107421875, 1.3848876953125, 1.463165283203125, 1.54144287109375, 1.619720458984375, 1.697998046875, 1.776275634765625, 1.85455322265625, 1.932830810546875, 2.0111083984375, 2.089385986328125, 2.16766357421875, 2.245941162109375, 2.32421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 4.0, 4.0, 7.0, 8.0, 5.0, 7.0, 14.0, 11.0, 24.0, 19.0, 23.0, 23.0, 31.0, 23.0, 27.0, 42.0, 45.0, 47.0, 41.0, 47.0, 45.0, 41.0, 45.0, 42.0, 50.0, 41.0, 46.0, 33.0, 39.0, 31.0, 26.0, 16.0, 24.0, 12.0, 13.0, 9.0, 7.0, 7.0, 10.0, 6.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.146484375, -2.083099365234375, -2.01971435546875, -1.956329345703125, -1.8929443359375, -1.829559326171875, -1.76617431640625, -1.702789306640625, -1.639404296875, -1.576019287109375, -1.51263427734375, -1.449249267578125, -1.3858642578125, -1.322479248046875, -1.25909423828125, -1.195709228515625, -1.13232421875, -1.068939208984375, -1.00555419921875, -0.942169189453125, -0.8787841796875, -0.815399169921875, -0.75201416015625, -0.688629150390625, -0.625244140625, -0.561859130859375, -0.49847412109375, -0.435089111328125, -0.3717041015625, -0.308319091796875, -0.24493408203125, -0.181549072265625, -0.1181640625, -0.054779052734375, 0.00860595703125, 0.071990966796875, 0.1353759765625, 0.198760986328125, 0.26214599609375, 0.325531005859375, 0.388916015625, 0.452301025390625, 0.51568603515625, 0.579071044921875, 0.6424560546875, 0.705841064453125, 0.76922607421875, 0.832611083984375, 0.89599609375, 0.959381103515625, 1.02276611328125, 1.086151123046875, 1.1495361328125, 1.212921142578125, 1.27630615234375, 1.339691162109375, 1.403076171875, 1.466461181640625, 1.52984619140625, 1.593231201171875, 1.6566162109375, 1.720001220703125, 1.78338623046875, 1.846771240234375, 1.91015625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 7.0, 3.0, 7.0, 12.0, 16.0, 22.0, 31.0, 59.0, 59.0, 111.0, 169.0, 290.0, 580.0, 1020.0, 2134.0, 5110.0, 13902.0, 51168.0, 315688.0, 533433.0, 90775.0, 21355.0, 6958.0, 2729.0, 1299.0, 688.0, 327.0, 217.0, 114.0, 81.0, 51.0, 39.0, 28.0, 18.0, 24.0, 12.0, 7.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.08984375, -1.0537261962890625, -1.017608642578125, -0.9814910888671875, -0.94537353515625, -0.9092559814453125, -0.873138427734375, -0.8370208740234375, -0.8009033203125, -0.7647857666015625, -0.728668212890625, -0.6925506591796875, -0.65643310546875, -0.6203155517578125, -0.584197998046875, -0.5480804443359375, -0.511962890625, -0.4758453369140625, -0.439727783203125, -0.4036102294921875, -0.36749267578125, -0.3313751220703125, -0.295257568359375, -0.2591400146484375, -0.2230224609375, -0.1869049072265625, -0.150787353515625, -0.1146697998046875, -0.07855224609375, -0.0424346923828125, -0.006317138671875, 0.0298004150390625, 0.06591796875, 0.1020355224609375, 0.138153076171875, 0.1742706298828125, 0.21038818359375, 0.2465057373046875, 0.282623291015625, 0.3187408447265625, 0.3548583984375, 0.3909759521484375, 0.427093505859375, 0.4632110595703125, 0.49932861328125, 0.5354461669921875, 0.571563720703125, 0.6076812744140625, 0.643798828125, 0.6799163818359375, 0.716033935546875, 0.7521514892578125, 0.78826904296875, 0.8243865966796875, 0.860504150390625, 0.8966217041015625, 0.9327392578125, 0.9688568115234375, 1.004974365234375, 1.0410919189453125, 1.07720947265625, 1.1133270263671875, 1.149444580078125, 1.1855621337890625, 1.2216796875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 5.0, 7.0, 7.0, 23.0, 20.0, 30.0, 38.0, 59.0, 74.0, 101.0, 96.0, 119.0, 102.0, 81.0, 61.0, 61.0, 35.0, 28.0, 10.0, 11.0, 9.0, 4.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00018453598022460938, -0.00017882511019706726, -0.00017311424016952515, -0.00016740337014198303, -0.00016169250011444092, -0.0001559816300868988, -0.0001502707600593567, -0.00014455989003181458, -0.00013884902000427246, -0.00013313814997673035, -0.00012742727994918823, -0.00012171640992164612, -0.000116005539894104, -0.00011029466986656189, -0.00010458379983901978, -9.887292981147766e-05, -9.316205978393555e-05, -8.745118975639343e-05, -8.174031972885132e-05, -7.60294497013092e-05, -7.031857967376709e-05, -6.460770964622498e-05, -5.889683961868286e-05, -5.318596959114075e-05, -4.747509956359863e-05, -4.176422953605652e-05, -3.6053359508514404e-05, -3.034248948097229e-05, -2.4631619453430176e-05, -1.892074942588806e-05, -1.3209879398345947e-05, -7.499009370803833e-06, -1.7881393432617188e-06, 3.9227306842803955e-06, 9.63360071182251e-06, 1.5344470739364624e-05, 2.1055340766906738e-05, 2.6766210794448853e-05, 3.247708082199097e-05, 3.818795084953308e-05, 4.3898820877075195e-05, 4.960969090461731e-05, 5.5320560932159424e-05, 6.103143095970154e-05, 6.674230098724365e-05, 7.245317101478577e-05, 7.816404104232788e-05, 8.387491106987e-05, 8.958578109741211e-05, 9.529665112495422e-05, 0.00010100752115249634, 0.00010671839118003845, 0.00011242926120758057, 0.00011814013123512268, 0.0001238510012626648, 0.0001295618712902069, 0.00013527274131774902, 0.00014098361134529114, 0.00014669448137283325, 0.00015240535140037537, 0.00015811622142791748, 0.0001638270914554596, 0.0001695379614830017, 0.00017524883151054382, 0.00018095970153808594]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 6.0, 11.0, 16.0, 34.0, 57.0, 106.0, 225.0, 391.0, 1065.0, 3505.0, 17864.0, 303769.0, 682950.0, 31224.0, 4967.0, 1355.0, 511.0, 224.0, 118.0, 62.0, 37.0, 21.0, 13.0, 8.0, 9.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.865234375, -1.791015625, -1.716796875, -1.642578125, -1.568359375, -1.494140625, -1.419921875, -1.345703125, -1.271484375, -1.197265625, -1.123046875, -1.048828125, -0.974609375, -0.900390625, -0.826171875, -0.751953125, -0.677734375, -0.603515625, -0.529296875, -0.455078125, -0.380859375, -0.306640625, -0.232421875, -0.158203125, -0.083984375, -0.009765625, 0.064453125, 0.138671875, 0.212890625, 0.287109375, 0.361328125, 0.435546875, 0.509765625, 0.583984375, 0.658203125, 0.732421875, 0.806640625, 0.880859375, 0.955078125, 1.029296875, 1.103515625, 1.177734375, 1.251953125, 1.326171875, 1.400390625, 1.474609375, 1.548828125, 1.623046875, 1.697265625, 1.771484375, 1.845703125, 1.919921875, 1.994140625, 2.068359375, 2.142578125, 2.216796875, 2.291015625, 2.365234375, 2.439453125, 2.513671875, 2.587890625, 2.662109375, 2.736328125, 2.810546875, 2.884765625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 7.0, 14.0, 11.0, 9.0, 34.0, 50.0, 89.0, 121.0, 163.0, 146.0, 111.0, 86.0, 53.0, 34.0, 18.0, 12.0, 8.0, 8.0, 6.0, 8.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.15234375, -1.1081390380859375, -1.063934326171875, -1.0197296142578125, -0.97552490234375, -0.9313201904296875, -0.887115478515625, -0.8429107666015625, -0.7987060546875, -0.7545013427734375, -0.710296630859375, -0.6660919189453125, -0.62188720703125, -0.5776824951171875, -0.533477783203125, -0.4892730712890625, -0.445068359375, -0.4008636474609375, -0.356658935546875, -0.3124542236328125, -0.26824951171875, -0.2240447998046875, -0.179840087890625, -0.1356353759765625, -0.0914306640625, -0.0472259521484375, -0.003021240234375, 0.0411834716796875, 0.08538818359375, 0.1295928955078125, 0.173797607421875, 0.2180023193359375, 0.26220703125, 0.3064117431640625, 0.350616455078125, 0.3948211669921875, 0.43902587890625, 0.4832305908203125, 0.527435302734375, 0.5716400146484375, 0.6158447265625, 0.6600494384765625, 0.704254150390625, 0.7484588623046875, 0.79266357421875, 0.8368682861328125, 0.881072998046875, 0.9252777099609375, 0.969482421875, 1.0136871337890625, 1.057891845703125, 1.1020965576171875, 1.14630126953125, 1.1905059814453125, 1.234710693359375, 1.2789154052734375, 1.3231201171875, 1.3673248291015625, 1.411529541015625, 1.4557342529296875, 1.49993896484375, 1.5441436767578125, 1.588348388671875, 1.6325531005859375, 1.6767578125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 6.0, 12.0, 14.0, 37.0, 66.0, 116.0, 198.0, 238.0, 156.0, 76.0, 46.0, 19.0, 8.0, 4.0, 1.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.41752815246582, -9.742835998535156, -9.068144798278809, -8.393452644348145, -7.718760967254639, -7.044069290161133, -6.369377136230469, -5.694685459136963, -5.019993782043457, -4.345302104949951, -3.670610189437866, -2.9959182739257812, -2.3212265968322754, -1.6465349197387695, -0.9718427658081055, -0.2971510887145996, 0.37754058837890625, 1.0522323846817017, 1.726924180984497, 2.401616096496582, 3.076307773590088, 3.7509994506835938, 4.425691604614258, 5.100383281707764, 5.7750749588012695, 6.449766635894775, 7.124458312988281, 7.799150466918945, 8.47384262084961, 9.148533821105957, 9.823225975036621, 10.497917175292969, 11.172611236572266, 11.84730339050293, 12.521994590759277, 13.196686744689941, 13.871377944946289, 14.546070098876953, 15.220762252807617, 15.895454406738281, 16.570144653320312, 17.244836807250977, 17.91952896118164, 18.594219207763672, 19.268911361694336, 19.943603515625, 20.618295669555664, 21.292987823486328, 21.967679977416992, 22.642372131347656, 23.31706428527832, 23.991756439208984, 24.666446685791016, 25.34113883972168, 26.015830993652344, 26.690523147583008, 27.365215301513672, 28.039907455444336, 28.714599609375, 29.38928985595703, 30.063982009887695, 30.73867416381836, 31.413366317749023, 32.08805847167969, 32.76274871826172]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 9.0, 10.0, 7.0, 14.0, 18.0, 21.0, 34.0, 26.0, 38.0, 47.0, 55.0, 46.0, 70.0, 76.0, 61.0, 72.0, 45.0, 62.0, 56.0, 38.0, 38.0, 39.0, 24.0, 25.0, 12.0, 16.0, 8.0, 9.0, 7.0, 3.0, 5.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.787322044372559, -13.250826835632324, -12.71433162689209, -12.177836418151855, -11.641341209411621, -11.104846000671387, -10.568350791931152, -10.031855583190918, -9.495360374450684, -8.95886516571045, -8.422369956970215, -7.8858747482299805, -7.349379539489746, -6.812884330749512, -6.276389122009277, -5.739893913269043, -5.203398704528809, -4.666903495788574, -4.13040828704834, -3.5939130783081055, -3.057417869567871, -2.5209226608276367, -1.9844274520874023, -1.447932243347168, -0.9114370346069336, -0.3749418258666992, 0.16155338287353516, 0.6980485916137695, 1.234543800354004, 1.7710390090942383, 2.3075342178344727, 2.844029426574707, 3.380523681640625, 3.9170188903808594, 4.453514099121094, 4.990009307861328, 5.5265045166015625, 6.062999725341797, 6.599494934082031, 7.135990142822266, 7.6724853515625, 8.208980560302734, 8.745475769042969, 9.281970977783203, 9.818466186523438, 10.354961395263672, 10.891456604003906, 11.42795181274414, 11.964447021484375, 12.50094223022461, 13.037437438964844, 13.573932647705078, 14.110427856445312, 14.646923065185547, 15.183418273925781, 15.719913482666016, 16.25640869140625, 16.792903900146484, 17.32939910888672, 17.865894317626953, 18.402389526367188, 18.938884735107422, 19.475379943847656, 20.01187515258789, 20.548370361328125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 9.0, 13.0, 27.0, 44.0, 56.0, 130.0, 228.0, 476.0, 1120.0, 3303.0, 13279.0, 133217.0, 3992514.0, 38811.0, 7305.0, 1965.0, 760.0, 374.0, 193.0, 146.0, 83.0, 62.0, 33.0, 28.0, 18.0, 10.0, 16.0, 13.0, 7.0, 5.0, 3.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.630859375, -3.467987060546875, -3.30511474609375, -3.142242431640625, -2.9793701171875, -2.816497802734375, -2.65362548828125, -2.490753173828125, -2.327880859375, -2.165008544921875, -2.00213623046875, -1.839263916015625, -1.6763916015625, -1.513519287109375, -1.35064697265625, -1.187774658203125, -1.02490234375, -0.862030029296875, -0.69915771484375, -0.536285400390625, -0.3734130859375, -0.210540771484375, -0.04766845703125, 0.115203857421875, 0.278076171875, 0.440948486328125, 0.60382080078125, 0.766693115234375, 0.9295654296875, 1.092437744140625, 1.25531005859375, 1.418182373046875, 1.5810546875, 1.743927001953125, 1.90679931640625, 2.069671630859375, 2.2325439453125, 2.395416259765625, 2.55828857421875, 2.721160888671875, 2.884033203125, 3.046905517578125, 3.20977783203125, 3.372650146484375, 3.5355224609375, 3.698394775390625, 3.86126708984375, 4.024139404296875, 4.18701171875, 4.349884033203125, 4.51275634765625, 4.675628662109375, 4.8385009765625, 5.001373291015625, 5.16424560546875, 5.327117919921875, 5.489990234375, 5.652862548828125, 5.81573486328125, 5.978607177734375, 6.1414794921875, 6.304351806640625, 6.46722412109375, 6.630096435546875, 6.79296875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 2.0, 8.0, 8.0, 16.0, 29.0, 49.0, 73.0, 88.0, 111.0, 121.0, 96.0, 111.0, 89.0, 78.0, 40.0, 33.0, 26.0, 15.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7802734375, -0.7451019287109375, -0.709930419921875, -0.6747589111328125, -0.63958740234375, -0.6044158935546875, -0.569244384765625, -0.5340728759765625, -0.4989013671875, -0.4637298583984375, -0.428558349609375, -0.3933868408203125, -0.35821533203125, -0.3230438232421875, -0.287872314453125, -0.2527008056640625, -0.217529296875, -0.1823577880859375, -0.147186279296875, -0.1120147705078125, -0.07684326171875, -0.0416717529296875, -0.006500244140625, 0.0286712646484375, 0.0638427734375, 0.0990142822265625, 0.134185791015625, 0.1693572998046875, 0.20452880859375, 0.2397003173828125, 0.274871826171875, 0.3100433349609375, 0.34521484375, 0.3803863525390625, 0.415557861328125, 0.4507293701171875, 0.48590087890625, 0.5210723876953125, 0.556243896484375, 0.5914154052734375, 0.6265869140625, 0.6617584228515625, 0.696929931640625, 0.7321014404296875, 0.76727294921875, 0.8024444580078125, 0.837615966796875, 0.8727874755859375, 0.907958984375, 0.9431304931640625, 0.978302001953125, 1.0134735107421875, 1.04864501953125, 1.0838165283203125, 1.118988037109375, 1.1541595458984375, 1.1893310546875, 1.2245025634765625, 1.259674072265625, 1.2948455810546875, 1.33001708984375, 1.3651885986328125, 1.400360107421875, 1.4355316162109375, 1.470703125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 7.0, 4.0, 9.0, 8.0, 14.0, 14.0, 21.0, 23.0, 32.0, 49.0, 45.0, 65.0, 133.0, 240.0, 570.0, 1749.0, 6256.0, 31838.0, 3603689.0, 521116.0, 21549.0, 4576.0, 1342.0, 459.0, 168.0, 85.0, 40.0, 40.0, 28.0, 22.0, 30.0, 15.0, 9.0, 8.0, 10.0, 3.0, 4.0, 6.0, 5.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-5.765625, -5.613494873046875, -5.46136474609375, -5.309234619140625, -5.1571044921875, -5.004974365234375, -4.85284423828125, -4.700714111328125, -4.548583984375, -4.396453857421875, -4.24432373046875, -4.092193603515625, -3.9400634765625, -3.787933349609375, -3.63580322265625, -3.483673095703125, -3.33154296875, -3.179412841796875, -3.02728271484375, -2.875152587890625, -2.7230224609375, -2.570892333984375, -2.41876220703125, -2.266632080078125, -2.114501953125, -1.962371826171875, -1.81024169921875, -1.658111572265625, -1.5059814453125, -1.353851318359375, -1.20172119140625, -1.049591064453125, -0.8974609375, -0.745330810546875, -0.59320068359375, -0.441070556640625, -0.2889404296875, -0.136810302734375, 0.01531982421875, 0.167449951171875, 0.319580078125, 0.471710205078125, 0.62384033203125, 0.775970458984375, 0.9281005859375, 1.080230712890625, 1.23236083984375, 1.384490966796875, 1.53662109375, 1.688751220703125, 1.84088134765625, 1.993011474609375, 2.1451416015625, 2.297271728515625, 2.44940185546875, 2.601531982421875, 2.753662109375, 2.905792236328125, 3.05792236328125, 3.210052490234375, 3.3621826171875, 3.514312744140625, 3.66644287109375, 3.818572998046875, 3.970703125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 5.0, 7.0, 7.0, 9.0, 4.0, 22.0, 20.0, 65.0, 168.0, 1043.0, 2336.0, 212.0, 83.0, 38.0, 20.0, 17.0, 10.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0], "bins": [-2.56640625, -2.511932373046875, -2.45745849609375, -2.402984619140625, -2.3485107421875, -2.294036865234375, -2.23956298828125, -2.185089111328125, -2.130615234375, -2.076141357421875, -2.02166748046875, -1.967193603515625, -1.9127197265625, -1.858245849609375, -1.80377197265625, -1.749298095703125, -1.69482421875, -1.640350341796875, -1.58587646484375, -1.531402587890625, -1.4769287109375, -1.422454833984375, -1.36798095703125, -1.313507080078125, -1.259033203125, -1.204559326171875, -1.15008544921875, -1.095611572265625, -1.0411376953125, -0.986663818359375, -0.93218994140625, -0.877716064453125, -0.8232421875, -0.768768310546875, -0.71429443359375, -0.659820556640625, -0.6053466796875, -0.550872802734375, -0.49639892578125, -0.441925048828125, -0.387451171875, -0.332977294921875, -0.27850341796875, -0.224029541015625, -0.1695556640625, -0.115081787109375, -0.06060791015625, -0.006134033203125, 0.04833984375, 0.102813720703125, 0.15728759765625, 0.211761474609375, 0.2662353515625, 0.320709228515625, 0.37518310546875, 0.429656982421875, 0.484130859375, 0.538604736328125, 0.59307861328125, 0.647552490234375, 0.7020263671875, 0.756500244140625, 0.81097412109375, 0.865447998046875, 0.919921875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 10.0, 21.0, 80.0, 268.0, 423.0, 166.0, 33.0, 9.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.32050323486328, -21.739404678344727, -21.158306121826172, -20.577205657958984, -19.99610710144043, -19.415008544921875, -18.83390998840332, -18.252811431884766, -17.671710968017578, -17.090612411499023, -16.50951385498047, -15.928414344787598, -15.347314834594727, -14.766216278076172, -14.185117721557617, -13.604018211364746, -13.022919654846191, -12.441821098327637, -11.860721588134766, -11.279623031616211, -10.69852352142334, -10.117424964904785, -9.536325454711914, -8.95522689819336, -8.374128341674805, -7.793029308319092, -7.211930274963379, -6.630831718444824, -6.049732208251953, -5.468633651733398, -4.8875346183776855, -4.306435585021973, -3.725337028503418, -3.144237995147705, -2.563138961791992, -1.9820401668548584, -1.4009411334991455, -0.8198421001434326, -0.23874330520629883, 0.34235572814941406, 0.923454761505127, 1.5045537948608398, 2.0856528282165527, 2.6667516231536865, 3.2478506565093994, 3.8289496898651123, 4.410048484802246, 4.991147518157959, 5.572246551513672, 6.153345584869385, 6.734444618225098, 7.315543174743652, 7.896642684936523, 8.477741241455078, 9.058839797973633, 9.639939308166504, 10.221038818359375, 10.80213737487793, 11.3832368850708, 11.964335441589355, 12.545434951782227, 13.126533508300781, 13.707632064819336, 14.288731575012207, 14.869830131530762]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 7.0, 8.0, 10.0, 14.0, 20.0, 22.0, 27.0, 46.0, 41.0, 50.0, 66.0, 58.0, 53.0, 61.0, 58.0, 66.0, 56.0, 51.0, 51.0, 51.0, 36.0, 31.0, 29.0, 14.0, 17.0, 14.0, 16.0, 5.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.688377380371094, -5.542111396789551, -5.395845890045166, -5.249580383300781, -5.103314399719238, -4.957048416137695, -4.8107829093933105, -4.664517402648926, -4.518251419067383, -4.37198543548584, -4.225719928741455, -4.07945442199707, -3.9331884384155273, -3.7869226932525635, -3.6406569480895996, -3.4943912029266357, -3.348125457763672, -3.201859712600708, -3.055593967437744, -2.9093282222747803, -2.7630624771118164, -2.6167967319488525, -2.4705309867858887, -2.324265241622925, -2.177999496459961, -2.031733751296997, -1.8854680061340332, -1.7392022609710693, -1.5929365158081055, -1.4466707706451416, -1.3004050254821777, -1.1541392803192139, -1.0078730583190918, -0.8616073131561279, -0.7153415679931641, -0.5690758228302002, -0.42281007766723633, -0.27654433250427246, -0.1302785873413086, 0.015987157821655273, 0.16225290298461914, 0.308518648147583, 0.4547843933105469, 0.6010501384735107, 0.7473158836364746, 0.8935816287994385, 1.0398473739624023, 1.1861131191253662, 1.33237886428833, 1.478644609451294, 1.6249103546142578, 1.7711760997772217, 1.9174418449401855, 2.0637075901031494, 2.2099733352661133, 2.356239080429077, 2.502504825592041, 2.648770570755005, 2.7950363159179688, 2.9413020610809326, 3.0875678062438965, 3.2338335514068604, 3.380099296569824, 3.526365041732788, 3.672630786895752]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 3.0, 2.0, 3.0, 11.0, 9.0, 15.0, 26.0, 34.0, 39.0, 59.0, 81.0, 116.0, 202.0, 413.0, 887.0, 2234.0, 6277.0, 22344.0, 116857.0, 598641.0, 244700.0, 40262.0, 9606.0, 3191.0, 1200.0, 551.0, 285.0, 178.0, 84.0, 65.0, 45.0, 20.0, 27.0, 17.0, 11.0, 11.0, 7.0, 9.0, 6.0, 6.0, 5.0, 5.0, 5.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.125, -4.0125732421875, -3.900146484375, -3.7877197265625, -3.67529296875, -3.5628662109375, -3.450439453125, -3.3380126953125, -3.2255859375, -3.1131591796875, -3.000732421875, -2.8883056640625, -2.77587890625, -2.6634521484375, -2.551025390625, -2.4385986328125, -2.326171875, -2.2137451171875, -2.101318359375, -1.9888916015625, -1.87646484375, -1.7640380859375, -1.651611328125, -1.5391845703125, -1.4267578125, -1.3143310546875, -1.201904296875, -1.0894775390625, -0.97705078125, -0.8646240234375, -0.752197265625, -0.6397705078125, -0.52734375, -0.4149169921875, -0.302490234375, -0.1900634765625, -0.07763671875, 0.0347900390625, 0.147216796875, 0.2596435546875, 0.3720703125, 0.4844970703125, 0.596923828125, 0.7093505859375, 0.82177734375, 0.9342041015625, 1.046630859375, 1.1590576171875, 1.271484375, 1.3839111328125, 1.496337890625, 1.6087646484375, 1.72119140625, 1.8336181640625, 1.946044921875, 2.0584716796875, 2.1708984375, 2.2833251953125, 2.395751953125, 2.5081787109375, 2.62060546875, 2.7330322265625, 2.845458984375, 2.9578857421875, 3.0703125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 6.0, 10.0, 19.0, 19.0, 45.0, 58.0, 95.0, 120.0, 113.0, 115.0, 114.0, 85.0, 66.0, 53.0, 39.0, 22.0, 13.0, 5.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90673828125, -0.8692703247070312, -0.8318023681640625, -0.7943344116210938, -0.756866455078125, -0.7193984985351562, -0.6819305419921875, -0.6444625854492188, -0.60699462890625, -0.5695266723632812, -0.5320587158203125, -0.49459075927734375, -0.457122802734375, -0.41965484619140625, -0.3821868896484375, -0.34471893310546875, -0.3072509765625, -0.26978302001953125, -0.2323150634765625, -0.19484710693359375, -0.157379150390625, -0.11991119384765625, -0.0824432373046875, -0.04497528076171875, -0.00750732421875, 0.02996063232421875, 0.0674285888671875, 0.10489654541015625, 0.142364501953125, 0.17983245849609375, 0.2173004150390625, 0.25476837158203125, 0.292236328125, 0.32970428466796875, 0.3671722412109375, 0.40464019775390625, 0.442108154296875, 0.47957611083984375, 0.5170440673828125, 0.5545120239257812, 0.59197998046875, 0.6294479370117188, 0.6669158935546875, 0.7043838500976562, 0.741851806640625, 0.7793197631835938, 0.8167877197265625, 0.8542556762695312, 0.8917236328125, 0.9291915893554688, 0.9666595458984375, 1.0041275024414062, 1.041595458984375, 1.0790634155273438, 1.1165313720703125, 1.1539993286132812, 1.19146728515625, 1.2289352416992188, 1.2664031982421875, 1.3038711547851562, 1.341339111328125, 1.3788070678710938, 1.4162750244140625, 1.4537429809570312, 1.4912109375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 7.0, 1.0, 5.0, 6.0, 8.0, 4.0, 8.0, 11.0, 21.0, 29.0, 41.0, 58.0, 113.0, 210.0, 401.0, 827.0, 1867.0, 4487.0, 12657.0, 42451.0, 182864.0, 555123.0, 184246.0, 42486.0, 12753.0, 4330.0, 1796.0, 802.0, 429.0, 182.0, 109.0, 65.0, 39.0, 34.0, 30.0, 24.0, 5.0, 5.0, 9.0, 6.0, 3.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.66796875, -2.59063720703125, -2.5133056640625, -2.43597412109375, -2.358642578125, -2.28131103515625, -2.2039794921875, -2.12664794921875, -2.04931640625, -1.97198486328125, -1.8946533203125, -1.81732177734375, -1.739990234375, -1.66265869140625, -1.5853271484375, -1.50799560546875, -1.4306640625, -1.35333251953125, -1.2760009765625, -1.19866943359375, -1.121337890625, -1.04400634765625, -0.9666748046875, -0.88934326171875, -0.81201171875, -0.73468017578125, -0.6573486328125, -0.58001708984375, -0.502685546875, -0.42535400390625, -0.3480224609375, -0.27069091796875, -0.193359375, -0.11602783203125, -0.0386962890625, 0.03863525390625, 0.115966796875, 0.19329833984375, 0.2706298828125, 0.34796142578125, 0.42529296875, 0.50262451171875, 0.5799560546875, 0.65728759765625, 0.734619140625, 0.81195068359375, 0.8892822265625, 0.96661376953125, 1.0439453125, 1.12127685546875, 1.1986083984375, 1.27593994140625, 1.353271484375, 1.43060302734375, 1.5079345703125, 1.58526611328125, 1.66259765625, 1.73992919921875, 1.8172607421875, 1.89459228515625, 1.971923828125, 2.04925537109375, 2.1265869140625, 2.20391845703125, 2.28125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 6.0, 8.0, 7.0, 6.0, 10.0, 13.0, 16.0, 19.0, 21.0, 29.0, 35.0, 32.0, 29.0, 39.0, 40.0, 56.0, 41.0, 47.0, 49.0, 41.0, 47.0, 34.0, 48.0, 33.0, 51.0, 36.0, 31.0, 26.0, 21.0, 22.0, 20.0, 19.0, 10.0, 8.0, 12.0, 8.0, 8.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.4453125, -2.3719482421875, -2.298583984375, -2.2252197265625, -2.15185546875, -2.0784912109375, -2.005126953125, -1.9317626953125, -1.8583984375, -1.7850341796875, -1.711669921875, -1.6383056640625, -1.56494140625, -1.4915771484375, -1.418212890625, -1.3448486328125, -1.271484375, -1.1981201171875, -1.124755859375, -1.0513916015625, -0.97802734375, -0.9046630859375, -0.831298828125, -0.7579345703125, -0.6845703125, -0.6112060546875, -0.537841796875, -0.4644775390625, -0.39111328125, -0.3177490234375, -0.244384765625, -0.1710205078125, -0.09765625, -0.0242919921875, 0.049072265625, 0.1224365234375, 0.19580078125, 0.2691650390625, 0.342529296875, 0.4158935546875, 0.4892578125, 0.5626220703125, 0.635986328125, 0.7093505859375, 0.78271484375, 0.8560791015625, 0.929443359375, 1.0028076171875, 1.076171875, 1.1495361328125, 1.222900390625, 1.2962646484375, 1.36962890625, 1.4429931640625, 1.516357421875, 1.5897216796875, 1.6630859375, 1.7364501953125, 1.809814453125, 1.8831787109375, 1.95654296875, 2.0299072265625, 2.103271484375, 2.1766357421875, 2.25]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 7.0, 14.0, 18.0, 56.0, 140.0, 377.0, 1728.0, 18648.0, 933808.0, 89087.0, 3646.0, 685.0, 184.0, 77.0, 33.0, 20.0, 7.0, 6.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.265625, -5.132965087890625, -5.00030517578125, -4.867645263671875, -4.7349853515625, -4.602325439453125, -4.46966552734375, -4.337005615234375, -4.204345703125, -4.071685791015625, -3.93902587890625, -3.806365966796875, -3.6737060546875, -3.541046142578125, -3.40838623046875, -3.275726318359375, -3.14306640625, -3.010406494140625, -2.87774658203125, -2.745086669921875, -2.6124267578125, -2.479766845703125, -2.34710693359375, -2.214447021484375, -2.081787109375, -1.949127197265625, -1.81646728515625, -1.683807373046875, -1.5511474609375, -1.418487548828125, -1.28582763671875, -1.153167724609375, -1.0205078125, -0.887847900390625, -0.75518798828125, -0.622528076171875, -0.4898681640625, -0.357208251953125, -0.22454833984375, -0.091888427734375, 0.040771484375, 0.173431396484375, 0.30609130859375, 0.438751220703125, 0.5714111328125, 0.704071044921875, 0.83673095703125, 0.969390869140625, 1.10205078125, 1.234710693359375, 1.36737060546875, 1.500030517578125, 1.6326904296875, 1.765350341796875, 1.89801025390625, 2.030670166015625, 2.163330078125, 2.295989990234375, 2.42864990234375, 2.561309814453125, 2.6939697265625, 2.826629638671875, 2.95928955078125, 3.091949462890625, 3.224609375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 7.0, 3.0, 6.0, 9.0, 6.0, 15.0, 22.0, 32.0, 46.0, 76.0, 91.0, 117.0, 143.0, 137.0, 88.0, 61.0, 42.0, 26.0, 16.0, 20.0, 8.0, 7.0, 9.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001863241195678711, -0.0001789722591638565, -0.00017162039875984192, -0.00016426853835582733, -0.00015691667795181274, -0.00014956481754779816, -0.00014221295714378357, -0.00013486109673976898, -0.0001275092363357544, -0.00012015737593173981, -0.00011280551552772522, -0.00010545365512371063, -9.810179471969604e-05, -9.074993431568146e-05, -8.339807391166687e-05, -7.604621350765228e-05, -6.86943531036377e-05, -6.134249269962311e-05, -5.399063229560852e-05, -4.663877189159393e-05, -3.9286911487579346e-05, -3.193505108356476e-05, -2.458319067955017e-05, -1.7231330275535583e-05, -9.879469871520996e-06, -2.5276094675064087e-06, 4.824250936508179e-06, 1.2176111340522766e-05, 1.9527971744537354e-05, 2.687983214855194e-05, 3.423169255256653e-05, 4.1583552956581116e-05, 4.89354133605957e-05, 5.628727376461029e-05, 6.363913416862488e-05, 7.099099457263947e-05, 7.834285497665405e-05, 8.569471538066864e-05, 9.304657578468323e-05, 0.00010039843618869781, 0.0001077502965927124, 0.00011510215699672699, 0.00012245401740074158, 0.00012980587780475616, 0.00013715773820877075, 0.00014450959861278534, 0.00015186145901679993, 0.00015921331942081451, 0.0001665651798248291, 0.0001739170402288437, 0.00018126890063285828, 0.00018862076103687286, 0.00019597262144088745, 0.00020332448184490204, 0.00021067634224891663, 0.0002180282026529312, 0.0002253800630569458, 0.0002327319234609604, 0.00024008378386497498, 0.00024743564426898956, 0.00025478750467300415, 0.00026213936507701874, 0.0002694912254810333, 0.0002768430858850479, 0.0002841949462890625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 6.0, 10.0, 16.0, 23.0, 49.0, 79.0, 136.0, 276.0, 846.0, 4152.0, 45924.0, 907238.0, 82396.0, 5728.0, 1044.0, 304.0, 128.0, 81.0, 41.0, 25.0, 24.0, 14.0, 6.0, 6.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.109375, -2.00689697265625, -1.9044189453125, -1.80194091796875, -1.699462890625, -1.59698486328125, -1.4945068359375, -1.39202880859375, -1.28955078125, -1.18707275390625, -1.0845947265625, -0.98211669921875, -0.879638671875, -0.77716064453125, -0.6746826171875, -0.57220458984375, -0.4697265625, -0.36724853515625, -0.2647705078125, -0.16229248046875, -0.059814453125, 0.04266357421875, 0.1451416015625, 0.24761962890625, 0.35009765625, 0.45257568359375, 0.5550537109375, 0.65753173828125, 0.760009765625, 0.86248779296875, 0.9649658203125, 1.06744384765625, 1.169921875, 1.27239990234375, 1.3748779296875, 1.47735595703125, 1.579833984375, 1.68231201171875, 1.7847900390625, 1.88726806640625, 1.98974609375, 2.09222412109375, 2.1947021484375, 2.29718017578125, 2.399658203125, 2.50213623046875, 2.6046142578125, 2.70709228515625, 2.8095703125, 2.91204833984375, 3.0145263671875, 3.11700439453125, 3.219482421875, 3.32196044921875, 3.4244384765625, 3.52691650390625, 3.62939453125, 3.73187255859375, 3.8343505859375, 3.93682861328125, 4.039306640625, 4.14178466796875, 4.2442626953125, 4.34674072265625, 4.44921875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 0.0, 14.0, 9.0, 25.0, 31.0, 31.0, 62.0, 73.0, 116.0, 138.0, 145.0, 123.0, 85.0, 51.0, 42.0, 22.0, 20.0, 6.0, 7.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.154296875, -1.09930419921875, -1.0443115234375, -0.98931884765625, -0.934326171875, -0.87933349609375, -0.8243408203125, -0.76934814453125, -0.71435546875, -0.65936279296875, -0.6043701171875, -0.54937744140625, -0.494384765625, -0.43939208984375, -0.3843994140625, -0.32940673828125, -0.2744140625, -0.21942138671875, -0.1644287109375, -0.10943603515625, -0.054443359375, 0.00054931640625, 0.0555419921875, 0.11053466796875, 0.16552734375, 0.22052001953125, 0.2755126953125, 0.33050537109375, 0.385498046875, 0.44049072265625, 0.4954833984375, 0.55047607421875, 0.60546875, 0.66046142578125, 0.7154541015625, 0.77044677734375, 0.825439453125, 0.88043212890625, 0.9354248046875, 0.99041748046875, 1.04541015625, 1.10040283203125, 1.1553955078125, 1.21038818359375, 1.265380859375, 1.32037353515625, 1.3753662109375, 1.43035888671875, 1.4853515625, 1.54034423828125, 1.5953369140625, 1.65032958984375, 1.705322265625, 1.76031494140625, 1.8153076171875, 1.87030029296875, 1.92529296875, 1.98028564453125, 2.0352783203125, 2.09027099609375, 2.145263671875, 2.20025634765625, 2.2552490234375, 2.31024169921875, 2.365234375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 8.0, 10.0, 21.0, 43.0, 75.0, 111.0, 168.0, 202.0, 178.0, 84.0, 47.0, 29.0, 14.0, 4.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.124906539916992, -21.42277717590332, -20.72064971923828, -20.01852035522461, -19.316390991210938, -18.6142635345459, -17.912134170532227, -17.210006713867188, -16.507877349853516, -15.80574893951416, -15.103620529174805, -14.401491165161133, -13.699362754821777, -12.997234344482422, -12.29510498046875, -11.592976570129395, -10.890848159790039, -10.188719749450684, -9.486591339111328, -8.784461975097656, -8.0823335647583, -7.380205154418945, -6.678076267242432, -5.975947380065918, -5.2738189697265625, -4.571690559387207, -3.8695616722106934, -3.167433023452759, -2.465304374694824, -1.7631757259368896, -1.061047077178955, -0.3589181900024414, 0.3432121276855469, 1.0453407764434814, 1.747469425201416, 2.4495980739593506, 3.151726722717285, 3.8538553714752197, 4.555984020233154, 5.258112907409668, 5.960241317749023, 6.662369728088379, 7.364498615264893, 8.066627502441406, 8.768755912780762, 9.470884323120117, 10.173013687133789, 10.875142097473145, 11.5772705078125, 12.279398918151855, 12.981527328491211, 13.683656692504883, 14.385785102844238, 15.087913513183594, 15.790042877197266, 16.492172241210938, 17.194299697875977, 17.89642906188965, 18.598556518554688, 19.30068588256836, 20.00281524658203, 20.70494270324707, 21.407072067260742, 22.10919952392578, 22.811328887939453]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 10.0, 7.0, 5.0, 11.0, 11.0, 21.0, 28.0, 22.0, 24.0, 34.0, 33.0, 40.0, 50.0, 45.0, 50.0, 55.0, 43.0, 61.0, 45.0, 40.0, 41.0, 37.0, 45.0, 40.0, 21.0, 31.0, 17.0, 26.0, 23.0, 15.0, 13.0, 12.0, 6.0, 8.0, 6.0, 8.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-16.695240020751953, -16.235525131225586, -15.775811195373535, -15.316096305847168, -14.856382369995117, -14.39666748046875, -13.936952590942383, -13.477237701416016, -13.017523765563965, -12.557808876037598, -12.098094940185547, -11.63838005065918, -11.178665161132812, -10.718951225280762, -10.259236335754395, -9.799522399902344, -9.339807510375977, -8.88009262084961, -8.420378684997559, -7.960663795471191, -7.500949382781982, -7.041234970092773, -6.581520080566406, -6.121805667877197, -5.662091255187988, -5.202376842498779, -4.74266242980957, -4.282947540283203, -3.823233127593994, -3.363518714904785, -2.903804063796997, -2.444089412689209, -1.9843740463256836, -1.524659514427185, -1.0649449825286865, -0.605230450630188, -0.14551591873168945, 0.31419849395751953, 0.7739131450653076, 1.2336277961730957, 1.6933422088623047, 2.1530566215515137, 2.6127712726593018, 3.07248592376709, 3.532200336456299, 3.991914749145508, 4.451629638671875, 4.911344051361084, 5.371058464050293, 5.830772876739502, 6.290487289428711, 6.750202178955078, 7.209916591644287, 7.669631004333496, 8.129345893859863, 8.589059829711914, 9.048774719238281, 9.508489608764648, 9.9682035446167, 10.427918434143066, 10.887632369995117, 11.347347259521484, 11.807062149047852, 12.266777038574219, 12.72649097442627]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 6.0, 12.0, 17.0, 18.0, 40.0, 44.0, 46.0, 128.0, 229.0, 452.0, 903.0, 2109.0, 5477.0, 17679.0, 101262.0, 3941805.0, 97486.0, 17088.0, 5526.0, 1994.0, 873.0, 399.0, 235.0, 133.0, 75.0, 50.0, 45.0, 31.0, 27.0, 11.0, 9.0, 8.0, 8.0, 5.0, 8.0, 14.0, 7.0, 7.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.35546875, -3.212646484375, -3.06982421875, -2.927001953125, -2.7841796875, -2.641357421875, -2.49853515625, -2.355712890625, -2.212890625, -2.070068359375, -1.92724609375, -1.784423828125, -1.6416015625, -1.498779296875, -1.35595703125, -1.213134765625, -1.0703125, -0.927490234375, -0.78466796875, -0.641845703125, -0.4990234375, -0.356201171875, -0.21337890625, -0.070556640625, 0.072265625, 0.215087890625, 0.35791015625, 0.500732421875, 0.6435546875, 0.786376953125, 0.92919921875, 1.072021484375, 1.21484375, 1.357666015625, 1.50048828125, 1.643310546875, 1.7861328125, 1.928955078125, 2.07177734375, 2.214599609375, 2.357421875, 2.500244140625, 2.64306640625, 2.785888671875, 2.9287109375, 3.071533203125, 3.21435546875, 3.357177734375, 3.5, 3.642822265625, 3.78564453125, 3.928466796875, 4.0712890625, 4.214111328125, 4.35693359375, 4.499755859375, 4.642578125, 4.785400390625, 4.92822265625, 5.071044921875, 5.2138671875, 5.356689453125, 5.49951171875, 5.642333984375, 5.78515625]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 7.0, 21.0, 25.0, 31.0, 54.0, 63.0, 83.0, 69.0, 103.0, 97.0, 100.0, 81.0, 65.0, 69.0, 40.0, 36.0, 16.0, 16.0, 10.0, 8.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92529296875, -0.8888168334960938, -0.8523406982421875, -0.8158645629882812, -0.779388427734375, -0.7429122924804688, -0.7064361572265625, -0.6699600219726562, -0.63348388671875, -0.5970077514648438, -0.5605316162109375, -0.5240554809570312, -0.487579345703125, -0.45110321044921875, -0.4146270751953125, -0.37815093994140625, -0.3416748046875, -0.30519866943359375, -0.2687225341796875, -0.23224639892578125, -0.195770263671875, -0.15929412841796875, -0.1228179931640625, -0.08634185791015625, -0.04986572265625, -0.01338958740234375, 0.0230865478515625, 0.05956268310546875, 0.096038818359375, 0.13251495361328125, 0.1689910888671875, 0.20546722412109375, 0.241943359375, 0.27841949462890625, 0.3148956298828125, 0.35137176513671875, 0.387847900390625, 0.42432403564453125, 0.4608001708984375, 0.49727630615234375, 0.53375244140625, 0.5702285766601562, 0.6067047119140625, 0.6431808471679688, 0.679656982421875, 0.7161331176757812, 0.7526092529296875, 0.7890853881835938, 0.8255615234375, 0.8620376586914062, 0.8985137939453125, 0.9349899291992188, 0.971466064453125, 1.0079421997070312, 1.0444183349609375, 1.0808944702148438, 1.11737060546875, 1.1538467407226562, 1.1903228759765625, 1.2267990112304688, 1.263275146484375, 1.2997512817382812, 1.3362274169921875, 1.3727035522460938, 1.4091796875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 7.0, 5.0, 8.0, 15.0, 24.0, 48.0, 91.0, 147.0, 373.0, 656.0, 1329.0, 2846.0, 7472.0, 24643.0, 177741.0, 3847351.0, 101881.0, 18930.0, 6017.0, 2436.0, 1102.0, 525.0, 280.0, 155.0, 84.0, 41.0, 26.0, 12.0, 9.0, 10.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.71875, -4.585418701171875, -4.45208740234375, -4.318756103515625, -4.1854248046875, -4.052093505859375, -3.91876220703125, -3.785430908203125, -3.652099609375, -3.518768310546875, -3.38543701171875, -3.252105712890625, -3.1187744140625, -2.985443115234375, -2.85211181640625, -2.718780517578125, -2.58544921875, -2.452117919921875, -2.31878662109375, -2.185455322265625, -2.0521240234375, -1.918792724609375, -1.78546142578125, -1.652130126953125, -1.518798828125, -1.385467529296875, -1.25213623046875, -1.118804931640625, -0.9854736328125, -0.852142333984375, -0.71881103515625, -0.585479736328125, -0.4521484375, -0.318817138671875, -0.18548583984375, -0.052154541015625, 0.0811767578125, 0.214508056640625, 0.34783935546875, 0.481170654296875, 0.614501953125, 0.747833251953125, 0.88116455078125, 1.014495849609375, 1.1478271484375, 1.281158447265625, 1.41448974609375, 1.547821044921875, 1.68115234375, 1.814483642578125, 1.94781494140625, 2.081146240234375, 2.2144775390625, 2.347808837890625, 2.48114013671875, 2.614471435546875, 2.747802734375, 2.881134033203125, 3.01446533203125, 3.147796630859375, 3.2811279296875, 3.414459228515625, 3.54779052734375, 3.681121826171875, 3.814453125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 4.0, 4.0, 14.0, 4.0, 16.0, 19.0, 39.0, 46.0, 106.0, 347.0, 2484.0, 546.0, 189.0, 85.0, 50.0, 33.0, 25.0, 12.0, 13.0, 6.0, 6.0, 8.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.125, -2.066986083984375, -2.00897216796875, -1.950958251953125, -1.8929443359375, -1.834930419921875, -1.77691650390625, -1.718902587890625, -1.660888671875, -1.602874755859375, -1.54486083984375, -1.486846923828125, -1.4288330078125, -1.370819091796875, -1.31280517578125, -1.254791259765625, -1.19677734375, -1.138763427734375, -1.08074951171875, -1.022735595703125, -0.9647216796875, -0.906707763671875, -0.84869384765625, -0.790679931640625, -0.732666015625, -0.674652099609375, -0.61663818359375, -0.558624267578125, -0.5006103515625, -0.442596435546875, -0.38458251953125, -0.326568603515625, -0.2685546875, -0.210540771484375, -0.15252685546875, -0.094512939453125, -0.0364990234375, 0.021514892578125, 0.07952880859375, 0.137542724609375, 0.195556640625, 0.253570556640625, 0.31158447265625, 0.369598388671875, 0.4276123046875, 0.485626220703125, 0.54364013671875, 0.601654052734375, 0.65966796875, 0.717681884765625, 0.77569580078125, 0.833709716796875, 0.8917236328125, 0.949737548828125, 1.00775146484375, 1.065765380859375, 1.123779296875, 1.181793212890625, 1.23980712890625, 1.297821044921875, 1.3558349609375, 1.413848876953125, 1.47186279296875, 1.529876708984375, 1.587890625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 10.0, 7.0, 27.0, 49.0, 92.0, 133.0, 188.0, 185.0, 119.0, 84.0, 40.0, 21.0, 17.0, 9.0, 2.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-8.480589866638184, -8.147573471069336, -7.814557075500488, -7.481540679931641, -7.148524284362793, -6.815507888793945, -6.482491493225098, -6.14947509765625, -5.816458702087402, -5.483442306518555, -5.150425910949707, -4.817409515380859, -4.484393119812012, -4.151376724243164, -3.8183603286743164, -3.4853439331054688, -3.152327537536621, -2.8193111419677734, -2.486294746398926, -2.153278350830078, -1.8202619552612305, -1.4872455596923828, -1.1542291641235352, -0.8212127685546875, -0.48819637298583984, -0.1551799774169922, 0.17783641815185547, 0.5108528137207031, 0.8438692092895508, 1.1768856048583984, 1.509902000427246, 1.8429183959960938, 2.175935745239258, 2.5089521408081055, 2.841968536376953, 3.174984931945801, 3.5080013275146484, 3.841017723083496, 4.174034118652344, 4.507050514221191, 4.840066909790039, 5.173083305358887, 5.506099700927734, 5.839116096496582, 6.17213249206543, 6.505148887634277, 6.838165283203125, 7.171181678771973, 7.50419807434082, 7.837214469909668, 8.170230865478516, 8.503247261047363, 8.836263656616211, 9.169280052185059, 9.502296447753906, 9.835312843322754, 10.168329238891602, 10.50134563446045, 10.834362030029297, 11.167378425598145, 11.500394821166992, 11.83341121673584, 12.166427612304688, 12.499444007873535, 12.832460403442383]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 5.0, 5.0, 7.0, 7.0, 13.0, 16.0, 20.0, 15.0, 32.0, 28.0, 35.0, 40.0, 33.0, 49.0, 58.0, 54.0, 55.0, 64.0, 57.0, 72.0, 54.0, 42.0, 50.0, 36.0, 21.0, 28.0, 16.0, 22.0, 18.0, 16.0, 17.0, 5.0, 4.0, 3.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-7.382684707641602, -7.187432765960693, -6.992180824279785, -6.796928405761719, -6.6016764640808105, -6.406424522399902, -6.211172580718994, -6.015920639038086, -5.8206682205200195, -5.625416278839111, -5.430164337158203, -5.234911918640137, -5.0396599769592285, -4.84440803527832, -4.649156093597412, -4.453904151916504, -4.258652210235596, -4.0634002685546875, -3.8681480884552, -3.672896146774292, -3.4776439666748047, -3.2823920249938965, -3.0871400833129883, -2.89188814163208, -2.6966359615325928, -2.5013840198516846, -2.3061318397521973, -2.110879898071289, -1.9156278371810913, -1.7203757762908936, -1.5251238346099854, -1.3298717737197876, -1.1346192359924316, -0.9393671751022339, -0.7441151738166809, -0.5488631725311279, -0.3536111116409302, -0.15835905075073242, 0.03689289093017578, 0.23214495182037354, 0.4273970127105713, 0.622649073600769, 0.817901074886322, 1.013153076171875, 1.2084051370620728, 1.4036571979522705, 1.5989091396331787, 1.7941612005233765, 1.9894132614135742, 2.1846652030944824, 2.3799173831939697, 2.575169324874878, 2.7704215049743652, 2.9656734466552734, 3.1609253883361816, 3.35617733001709, 3.551429510116577, 3.7466814517974854, 3.9419336318969727, 4.137185573577881, 4.332437515258789, 4.5276899337768555, 4.7229413986206055, 4.918193817138672, 5.11344575881958]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 3.0, 8.0, 12.0, 17.0, 22.0, 48.0, 72.0, 142.0, 310.0, 658.0, 1785.0, 6441.0, 38343.0, 438035.0, 508904.0, 43424.0, 7078.0, 1916.0, 687.0, 308.0, 122.0, 77.0, 59.0, 28.0, 21.0, 11.0, 3.0, 6.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.09765625, -5.93731689453125, -5.7769775390625, -5.61663818359375, -5.456298828125, -5.29595947265625, -5.1356201171875, -4.97528076171875, -4.81494140625, -4.65460205078125, -4.4942626953125, -4.33392333984375, -4.173583984375, -4.01324462890625, -3.8529052734375, -3.69256591796875, -3.5322265625, -3.37188720703125, -3.2115478515625, -3.05120849609375, -2.890869140625, -2.73052978515625, -2.5701904296875, -2.40985107421875, -2.24951171875, -2.08917236328125, -1.9288330078125, -1.76849365234375, -1.608154296875, -1.44781494140625, -1.2874755859375, -1.12713623046875, -0.966796875, -0.80645751953125, -0.6461181640625, -0.48577880859375, -0.325439453125, -0.16510009765625, -0.0047607421875, 0.15557861328125, 0.31591796875, 0.47625732421875, 0.6365966796875, 0.79693603515625, 0.957275390625, 1.11761474609375, 1.2779541015625, 1.43829345703125, 1.5986328125, 1.75897216796875, 1.9193115234375, 2.07965087890625, 2.239990234375, 2.40032958984375, 2.5606689453125, 2.72100830078125, 2.88134765625, 3.04168701171875, 3.2020263671875, 3.36236572265625, 3.522705078125, 3.68304443359375, 3.8433837890625, 4.00372314453125, 4.1640625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 9.0, 20.0, 20.0, 27.0, 45.0, 60.0, 74.0, 82.0, 68.0, 92.0, 85.0, 82.0, 86.0, 61.0, 51.0, 52.0, 29.0, 19.0, 18.0, 10.0, 7.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89892578125, -0.8643112182617188, -0.8296966552734375, -0.7950820922851562, -0.760467529296875, -0.7258529663085938, -0.6912384033203125, -0.6566238403320312, -0.62200927734375, -0.5873947143554688, -0.5527801513671875, -0.5181655883789062, -0.483551025390625, -0.44893646240234375, -0.4143218994140625, -0.37970733642578125, -0.3450927734375, -0.31047821044921875, -0.2758636474609375, -0.24124908447265625, -0.206634521484375, -0.17201995849609375, -0.1374053955078125, -0.10279083251953125, -0.06817626953125, -0.03356170654296875, 0.0010528564453125, 0.03566741943359375, 0.070281982421875, 0.10489654541015625, 0.1395111083984375, 0.17412567138671875, 0.208740234375, 0.24335479736328125, 0.2779693603515625, 0.31258392333984375, 0.347198486328125, 0.38181304931640625, 0.4164276123046875, 0.45104217529296875, 0.48565673828125, 0.5202713012695312, 0.5548858642578125, 0.5895004272460938, 0.624114990234375, 0.6587295532226562, 0.6933441162109375, 0.7279586791992188, 0.7625732421875, 0.7971878051757812, 0.8318023681640625, 0.8664169311523438, 0.901031494140625, 0.9356460571289062, 0.9702606201171875, 1.0048751831054688, 1.03948974609375, 1.0741043090820312, 1.1087188720703125, 1.1433334350585938, 1.177947998046875, 1.2125625610351562, 1.2471771240234375, 1.2817916870117188, 1.31640625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 6.0, 10.0, 11.0, 13.0, 12.0, 19.0, 16.0, 30.0, 34.0, 72.0, 95.0, 190.0, 388.0, 899.0, 2587.0, 9358.0, 42472.0, 273697.0, 590588.0, 101299.0, 19198.0, 4825.0, 1518.0, 598.0, 241.0, 132.0, 77.0, 48.0, 40.0, 19.0, 20.0, 12.0, 6.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.626953125, -3.526885986328125, -3.42681884765625, -3.326751708984375, -3.2266845703125, -3.126617431640625, -3.02655029296875, -2.926483154296875, -2.826416015625, -2.726348876953125, -2.62628173828125, -2.526214599609375, -2.4261474609375, -2.326080322265625, -2.22601318359375, -2.125946044921875, -2.02587890625, -1.925811767578125, -1.82574462890625, -1.725677490234375, -1.6256103515625, -1.525543212890625, -1.42547607421875, -1.325408935546875, -1.225341796875, -1.125274658203125, -1.02520751953125, -0.925140380859375, -0.8250732421875, -0.725006103515625, -0.62493896484375, -0.524871826171875, -0.4248046875, -0.324737548828125, -0.22467041015625, -0.124603271484375, -0.0245361328125, 0.075531005859375, 0.17559814453125, 0.275665283203125, 0.375732421875, 0.475799560546875, 0.57586669921875, 0.675933837890625, 0.7760009765625, 0.876068115234375, 0.97613525390625, 1.076202392578125, 1.17626953125, 1.276336669921875, 1.37640380859375, 1.476470947265625, 1.5765380859375, 1.676605224609375, 1.77667236328125, 1.876739501953125, 1.976806640625, 2.076873779296875, 2.17694091796875, 2.277008056640625, 2.3770751953125, 2.477142333984375, 2.57720947265625, 2.677276611328125, 2.77734375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 3.0, 3.0, 5.0, 6.0, 7.0, 15.0, 11.0, 13.0, 16.0, 20.0, 23.0, 34.0, 31.0, 23.0, 33.0, 41.0, 42.0, 36.0, 43.0, 49.0, 45.0, 52.0, 47.0, 52.0, 42.0, 43.0, 39.0, 31.0, 31.0, 28.0, 26.0, 17.0, 16.0, 15.0, 12.0, 9.0, 12.0, 6.0, 6.0, 3.0, 7.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.0390625, -2.953857421875, -2.86865234375, -2.783447265625, -2.6982421875, -2.613037109375, -2.52783203125, -2.442626953125, -2.357421875, -2.272216796875, -2.18701171875, -2.101806640625, -2.0166015625, -1.931396484375, -1.84619140625, -1.760986328125, -1.67578125, -1.590576171875, -1.50537109375, -1.420166015625, -1.3349609375, -1.249755859375, -1.16455078125, -1.079345703125, -0.994140625, -0.908935546875, -0.82373046875, -0.738525390625, -0.6533203125, -0.568115234375, -0.48291015625, -0.397705078125, -0.3125, -0.227294921875, -0.14208984375, -0.056884765625, 0.0283203125, 0.113525390625, 0.19873046875, 0.283935546875, 0.369140625, 0.454345703125, 0.53955078125, 0.624755859375, 0.7099609375, 0.795166015625, 0.88037109375, 0.965576171875, 1.05078125, 1.135986328125, 1.22119140625, 1.306396484375, 1.3916015625, 1.476806640625, 1.56201171875, 1.647216796875, 1.732421875, 1.817626953125, 1.90283203125, 1.988037109375, 2.0732421875, 2.158447265625, 2.24365234375, 2.328857421875, 2.4140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 14.0, 12.0, 59.0, 177.0, 938.0, 38879.0, 1002803.0, 5101.0, 405.0, 106.0, 36.0, 11.0, 9.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.40234375, -6.19775390625, -5.9931640625, -5.78857421875, -5.583984375, -5.37939453125, -5.1748046875, -4.97021484375, -4.765625, -4.56103515625, -4.3564453125, -4.15185546875, -3.947265625, -3.74267578125, -3.5380859375, -3.33349609375, -3.12890625, -2.92431640625, -2.7197265625, -2.51513671875, -2.310546875, -2.10595703125, -1.9013671875, -1.69677734375, -1.4921875, -1.28759765625, -1.0830078125, -0.87841796875, -0.673828125, -0.46923828125, -0.2646484375, -0.06005859375, 0.14453125, 0.34912109375, 0.5537109375, 0.75830078125, 0.962890625, 1.16748046875, 1.3720703125, 1.57666015625, 1.78125, 1.98583984375, 2.1904296875, 2.39501953125, 2.599609375, 2.80419921875, 3.0087890625, 3.21337890625, 3.41796875, 3.62255859375, 3.8271484375, 4.03173828125, 4.236328125, 4.44091796875, 4.6455078125, 4.85009765625, 5.0546875, 5.25927734375, 5.4638671875, 5.66845703125, 5.873046875, 6.07763671875, 6.2822265625, 6.48681640625, 6.69140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 4.0, 9.0, 17.0, 25.0, 23.0, 49.0, 78.0, 136.0, 180.0, 176.0, 112.0, 59.0, 29.0, 37.0, 14.0, 10.0, 9.0, 7.0, 3.0, 2.0, 2.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002727508544921875, -0.00026259198784828186, -0.0002524331212043762, -0.00024227425456047058, -0.00023211538791656494, -0.0002219565212726593, -0.00021179765462875366, -0.00020163878798484802, -0.00019147992134094238, -0.00018132105469703674, -0.0001711621880531311, -0.00016100332140922546, -0.00015084445476531982, -0.00014068558812141418, -0.00013052672147750854, -0.0001203678548336029, -0.00011020898818969727, -0.00010005012154579163, -8.989125490188599e-05, -7.973238825798035e-05, -6.957352161407471e-05, -5.941465497016907e-05, -4.925578832626343e-05, -3.909692168235779e-05, -2.893805503845215e-05, -1.877918839454651e-05, -8.620321750640869e-06, 1.5385448932647705e-06, 1.169741153717041e-05, 2.185627818107605e-05, 3.201514482498169e-05, 4.217401146888733e-05, 5.233287811279297e-05, 6.249174475669861e-05, 7.265061140060425e-05, 8.280947804450989e-05, 9.296834468841553e-05, 0.00010312721133232117, 0.0001132860779762268, 0.00012344494462013245, 0.00013360381126403809, 0.00014376267790794373, 0.00015392154455184937, 0.000164080411195755, 0.00017423927783966064, 0.00018439814448356628, 0.00019455701112747192, 0.00020471587777137756, 0.0002148747444152832, 0.00022503361105918884, 0.00023519247770309448, 0.0002453513443470001, 0.00025551021099090576, 0.0002656690776348114, 0.00027582794427871704, 0.0002859868109226227, 0.0002961456775665283, 0.00030630454421043396, 0.0003164634108543396, 0.00032662227749824524, 0.0003367811441421509, 0.0003469400107860565, 0.00035709887742996216, 0.0003672577440738678, 0.00037741661071777344]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 13.0, 21.0, 19.0, 70.0, 168.0, 443.0, 4743.0, 995965.0, 45679.0, 987.0, 227.0, 115.0, 43.0, 31.0, 12.0, 10.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.58203125, -4.38043212890625, -4.1788330078125, -3.97723388671875, -3.775634765625, -3.57403564453125, -3.3724365234375, -3.17083740234375, -2.96923828125, -2.76763916015625, -2.5660400390625, -2.36444091796875, -2.162841796875, -1.96124267578125, -1.7596435546875, -1.55804443359375, -1.3564453125, -1.15484619140625, -0.9532470703125, -0.75164794921875, -0.550048828125, -0.34844970703125, -0.1468505859375, 0.05474853515625, 0.25634765625, 0.45794677734375, 0.6595458984375, 0.86114501953125, 1.062744140625, 1.26434326171875, 1.4659423828125, 1.66754150390625, 1.869140625, 2.07073974609375, 2.2723388671875, 2.47393798828125, 2.675537109375, 2.87713623046875, 3.0787353515625, 3.28033447265625, 3.48193359375, 3.68353271484375, 3.8851318359375, 4.08673095703125, 4.288330078125, 4.48992919921875, 4.6915283203125, 4.89312744140625, 5.0947265625, 5.29632568359375, 5.4979248046875, 5.69952392578125, 5.901123046875, 6.10272216796875, 6.3043212890625, 6.50592041015625, 6.70751953125, 6.90911865234375, 7.1107177734375, 7.31231689453125, 7.513916015625, 7.71551513671875, 7.9171142578125, 8.11871337890625, 8.3203125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 18.0, 62.0, 200.0, 413.0, 212.0, 68.0, 18.0, 9.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.951171875, -2.800384521484375, -2.64959716796875, -2.498809814453125, -2.3480224609375, -2.197235107421875, -2.04644775390625, -1.895660400390625, -1.744873046875, -1.594085693359375, -1.44329833984375, -1.292510986328125, -1.1417236328125, -0.990936279296875, -0.84014892578125, -0.689361572265625, -0.53857421875, -0.387786865234375, -0.23699951171875, -0.086212158203125, 0.0645751953125, 0.215362548828125, 0.36614990234375, 0.516937255859375, 0.667724609375, 0.818511962890625, 0.96929931640625, 1.120086669921875, 1.2708740234375, 1.421661376953125, 1.57244873046875, 1.723236083984375, 1.8740234375, 2.024810791015625, 2.17559814453125, 2.326385498046875, 2.4771728515625, 2.627960205078125, 2.77874755859375, 2.929534912109375, 3.080322265625, 3.231109619140625, 3.38189697265625, 3.532684326171875, 3.6834716796875, 3.834259033203125, 3.98504638671875, 4.135833740234375, 4.28662109375, 4.437408447265625, 4.58819580078125, 4.738983154296875, 4.8897705078125, 5.040557861328125, 5.19134521484375, 5.342132568359375, 5.492919921875, 5.643707275390625, 5.79449462890625, 5.945281982421875, 6.0960693359375, 6.246856689453125, 6.39764404296875, 6.548431396484375, 6.69921875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 9.0, 35.0, 129.0, 347.0, 331.0, 119.0, 21.0, 12.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.394371032714844, -30.85837745666504, -29.322385787963867, -27.786392211914062, -26.250398635864258, -24.714405059814453, -23.17841339111328, -21.642419815063477, -20.106426239013672, -18.570432662963867, -17.034440994262695, -15.49844741821289, -13.962453842163086, -12.426461219787598, -10.89046859741211, -9.354475021362305, -7.818483352661133, -6.282490253448486, -4.74649715423584, -3.2105045318603516, -1.674511432647705, -0.1385183334350586, 1.3974742889404297, 2.9334678649902344, 4.469460487365723, 6.005453586578369, 7.541446685791016, 9.077439308166504, 10.613431930541992, 12.149425506591797, 13.685418128967285, 15.22141170501709, 16.757404327392578, 18.293397903442383, 19.829389572143555, 21.36538314819336, 22.901376724243164, 24.43737030029297, 25.97336196899414, 27.509355545043945, 29.04534912109375, 30.581342697143555, 32.11733627319336, 33.65332794189453, 35.1893196105957, 36.72531509399414, 38.26130676269531, 39.79730224609375, 41.333290100097656, 42.86928176879883, 44.405277252197266, 45.94126892089844, 47.47726058959961, 49.01325607299805, 50.54924774169922, 52.085243225097656, 53.62123489379883, 55.1572265625, 56.69322204589844, 58.22921371459961, 59.76520538330078, 61.30120086669922, 62.83719253540039, 64.37318420410156, 65.9091796875]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 6.0, 7.0, 3.0, 7.0, 18.0, 15.0, 20.0, 30.0, 26.0, 30.0, 28.0, 32.0, 33.0, 47.0, 36.0, 43.0, 41.0, 34.0, 42.0, 45.0, 53.0, 40.0, 36.0, 26.0, 40.0, 33.0, 35.0, 37.0, 28.0, 19.0, 22.0, 21.0, 14.0, 12.0, 15.0, 6.0, 7.0, 2.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-15.0291748046875, -14.618408203125, -14.2076416015625, -13.796875, -13.3861083984375, -12.975341796875, -12.5645751953125, -12.15380859375, -11.7430419921875, -11.332275390625, -10.9215087890625, -10.5107421875, -10.0999755859375, -9.689208984375, -9.2784423828125, -8.86767578125, -8.4569091796875, -8.046142578125, -7.6353759765625, -7.224609375, -6.8138427734375, -6.403076171875, -5.9923095703125, -5.58154296875, -5.170775413513184, -4.760008811950684, -4.349242210388184, -3.9384756088256836, -3.5277090072631836, -3.1169421672821045, -2.7061755657196045, -2.2954089641571045, -1.8846426010131836, -1.4738759994506836, -1.0631093978881836, -0.652342677116394, -0.24157607555389404, 0.1691906452178955, 0.5799572467803955, 0.9907238483428955, 1.4014904499053955, 1.8122570514678955, 2.2230236530303955, 2.6337904930114746, 3.0445570945739746, 3.4553236961364746, 3.8660902976989746, 4.276856899261475, 4.687623500823975, 5.098390102386475, 5.509156703948975, 5.919923305511475, 6.330689907073975, 6.741456985473633, 7.152223587036133, 7.562990188598633, 7.973756790161133, 8.384523391723633, 8.795289993286133, 9.206056594848633, 9.616823196411133, 10.027589797973633, 10.438356399536133, 10.849123001098633, 11.259889602661133]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 5.0, 8.0, 23.0, 33.0, 35.0, 57.0, 92.0, 161.0, 287.0, 628.0, 1455.0, 4431.0, 18747.0, 825551.0, 3315145.0, 20401.0, 4538.0, 1374.0, 561.0, 303.0, 147.0, 85.0, 63.0, 30.0, 26.0, 28.0, 11.0, 7.0, 11.0, 8.0, 7.0, 5.0, 5.0, 7.0, 3.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-5.296875, -5.1143798828125, -4.931884765625, -4.7493896484375, -4.56689453125, -4.3843994140625, -4.201904296875, -4.0194091796875, -3.8369140625, -3.6544189453125, -3.471923828125, -3.2894287109375, -3.10693359375, -2.9244384765625, -2.741943359375, -2.5594482421875, -2.376953125, -2.1944580078125, -2.011962890625, -1.8294677734375, -1.64697265625, -1.4644775390625, -1.281982421875, -1.0994873046875, -0.9169921875, -0.7344970703125, -0.552001953125, -0.3695068359375, -0.18701171875, -0.0045166015625, 0.177978515625, 0.3604736328125, 0.54296875, 0.7254638671875, 0.907958984375, 1.0904541015625, 1.27294921875, 1.4554443359375, 1.637939453125, 1.8204345703125, 2.0029296875, 2.1854248046875, 2.367919921875, 2.5504150390625, 2.73291015625, 2.9154052734375, 3.097900390625, 3.2803955078125, 3.462890625, 3.6453857421875, 3.827880859375, 4.0103759765625, 4.19287109375, 4.3753662109375, 4.557861328125, 4.7403564453125, 4.9228515625, 5.1053466796875, 5.287841796875, 5.4703369140625, 5.65283203125, 5.8353271484375, 6.017822265625, 6.2003173828125, 6.3828125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 3.0, 5.0, 3.0, 16.0, 14.0, 31.0, 47.0, 56.0, 71.0, 66.0, 76.0, 74.0, 82.0, 90.0, 91.0, 64.0, 59.0, 49.0, 43.0, 22.0, 17.0, 15.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.935546875, -0.8985443115234375, -0.861541748046875, -0.8245391845703125, -0.78753662109375, -0.7505340576171875, -0.713531494140625, -0.6765289306640625, -0.6395263671875, -0.6025238037109375, -0.565521240234375, -0.5285186767578125, -0.49151611328125, -0.4545135498046875, -0.417510986328125, -0.3805084228515625, -0.343505859375, -0.3065032958984375, -0.269500732421875, -0.2324981689453125, -0.19549560546875, -0.1584930419921875, -0.121490478515625, -0.0844879150390625, -0.0474853515625, -0.0104827880859375, 0.026519775390625, 0.0635223388671875, 0.10052490234375, 0.1375274658203125, 0.174530029296875, 0.2115325927734375, 0.24853515625, 0.2855377197265625, 0.322540283203125, 0.3595428466796875, 0.39654541015625, 0.4335479736328125, 0.470550537109375, 0.5075531005859375, 0.5445556640625, 0.5815582275390625, 0.618560791015625, 0.6555633544921875, 0.69256591796875, 0.7295684814453125, 0.766571044921875, 0.8035736083984375, 0.840576171875, 0.8775787353515625, 0.914581298828125, 0.9515838623046875, 0.98858642578125, 1.0255889892578125, 1.062591552734375, 1.0995941162109375, 1.1365966796875, 1.1735992431640625, 1.210601806640625, 1.2476043701171875, 1.28460693359375, 1.3216094970703125, 1.358612060546875, 1.3956146240234375, 1.4326171875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 9.0, 10.0, 19.0, 15.0, 49.0, 43.0, 57.0, 76.0, 135.0, 208.0, 472.0, 1213.0, 7001.0, 169175.0, 3995154.0, 17074.0, 2207.0, 647.0, 282.0, 160.0, 92.0, 65.0, 25.0, 29.0, 15.0, 10.0, 14.0, 9.0, 7.0, 6.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.8984375, -10.62725830078125, -10.3560791015625, -10.08489990234375, -9.813720703125, -9.54254150390625, -9.2713623046875, -9.00018310546875, -8.72900390625, -8.45782470703125, -8.1866455078125, -7.91546630859375, -7.644287109375, -7.37310791015625, -7.1019287109375, -6.83074951171875, -6.5595703125, -6.28839111328125, -6.0172119140625, -5.74603271484375, -5.474853515625, -5.20367431640625, -4.9324951171875, -4.66131591796875, -4.39013671875, -4.11895751953125, -3.8477783203125, -3.57659912109375, -3.305419921875, -3.03424072265625, -2.7630615234375, -2.49188232421875, -2.220703125, -1.94952392578125, -1.6783447265625, -1.40716552734375, -1.135986328125, -0.86480712890625, -0.5936279296875, -0.32244873046875, -0.05126953125, 0.21990966796875, 0.4910888671875, 0.76226806640625, 1.033447265625, 1.30462646484375, 1.5758056640625, 1.84698486328125, 2.1181640625, 2.38934326171875, 2.6605224609375, 2.93170166015625, 3.202880859375, 3.47406005859375, 3.7452392578125, 4.01641845703125, 4.28759765625, 4.55877685546875, 4.8299560546875, 5.10113525390625, 5.372314453125, 5.64349365234375, 5.9146728515625, 6.18585205078125, 6.45703125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 9.0, 15.0, 31.0, 91.0, 440.0, 3213.0, 193.0, 48.0, 16.0, 10.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.55859375, -4.450653076171875, -4.34271240234375, -4.234771728515625, -4.1268310546875, -4.018890380859375, -3.91094970703125, -3.803009033203125, -3.695068359375, -3.587127685546875, -3.47918701171875, -3.371246337890625, -3.2633056640625, -3.155364990234375, -3.04742431640625, -2.939483642578125, -2.83154296875, -2.723602294921875, -2.61566162109375, -2.507720947265625, -2.3997802734375, -2.291839599609375, -2.18389892578125, -2.075958251953125, -1.968017578125, -1.860076904296875, -1.75213623046875, -1.644195556640625, -1.5362548828125, -1.428314208984375, -1.32037353515625, -1.212432861328125, -1.1044921875, -0.996551513671875, -0.88861083984375, -0.780670166015625, -0.6727294921875, -0.564788818359375, -0.45684814453125, -0.348907470703125, -0.240966796875, -0.133026123046875, -0.02508544921875, 0.082855224609375, 0.1907958984375, 0.298736572265625, 0.40667724609375, 0.514617919921875, 0.62255859375, 0.730499267578125, 0.83843994140625, 0.946380615234375, 1.0543212890625, 1.162261962890625, 1.27020263671875, 1.378143310546875, 1.486083984375, 1.594024658203125, 1.70196533203125, 1.809906005859375, 1.9178466796875, 2.025787353515625, 2.13372802734375, 2.241668701171875, 2.349609375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 8.0, 19.0, 16.0, 53.0, 87.0, 178.0, 278.0, 220.0, 76.0, 41.0, 9.0, 8.0, 4.0, 1.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.886222839355469, -9.479033470153809, -9.071845054626465, -8.664655685424805, -8.257466316223145, -7.850277423858643, -7.443088531494141, -7.0358991622924805, -6.62870979309082, -6.221520900726318, -5.814331531524658, -5.407142639160156, -4.999953269958496, -4.592764377593994, -4.185575485229492, -3.778386116027832, -3.37119722366333, -2.964008092880249, -2.556818962097168, -2.149630069732666, -1.7424408197402954, -1.335251808166504, -0.9280626773834229, -0.5208735466003418, -0.11368441581726074, 0.2935046851634979, 0.7006937861442566, 1.1078828573226929, 1.515071988105774, 1.9222609996795654, 2.3294501304626465, 2.7366392612457275, 3.1438283920288086, 3.5510175228118896, 3.9582066535949707, 4.365395545959473, 4.772584915161133, 5.179773807525635, 5.586962699890137, 5.994152069091797, 6.401341438293457, 6.808530330657959, 7.215719699859619, 7.622908592224121, 8.030097961425781, 8.437286376953125, 8.844475746154785, 9.251665115356445, 9.658853530883789, 10.06604290008545, 10.473231315612793, 10.880420684814453, 11.287610054016113, 11.694799423217773, 12.101987838745117, 12.509177207946777, 12.916366577148438, 13.323555946350098, 13.730744361877441, 14.137933731079102, 14.545123100280762, 14.952312469482422, 15.359500885009766, 15.766690254211426, 16.173879623413086]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 7.0, 7.0, 6.0, 9.0, 12.0, 15.0, 14.0, 23.0, 24.0, 33.0, 28.0, 41.0, 42.0, 41.0, 48.0, 54.0, 41.0, 44.0, 46.0, 47.0, 53.0, 57.0, 37.0, 38.0, 36.0, 28.0, 29.0, 30.0, 16.0, 23.0, 9.0, 17.0, 8.0, 12.0, 8.0, 6.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-5.456357479095459, -5.305401802062988, -5.154446125030518, -5.003490447998047, -4.852534294128418, -4.701578617095947, -4.550622940063477, -4.399667263031006, -4.248711585998535, -4.0977559089660645, -3.9468002319335938, -3.795844316482544, -3.6448886394500732, -3.4939329624176025, -3.3429770469665527, -3.192021369934082, -3.0410656929016113, -2.8901100158691406, -2.73915433883667, -2.58819842338562, -2.4372427463531494, -2.2862870693206787, -2.135331153869629, -1.9843754768371582, -1.8334197998046875, -1.6824641227722168, -1.5315083265304565, -1.3805525302886963, -1.2295968532562256, -1.0786411762237549, -0.9276853799819946, -0.7767295837402344, -0.6257734298706055, -0.47481769323349, -0.3238619565963745, -0.17290621995925903, -0.021950483322143555, 0.12900525331497192, 0.2799609899520874, 0.43091678619384766, 0.5818724632263184, 0.7328281998634338, 0.8837839365005493, 1.0347397327423096, 1.1856954097747803, 1.336651086807251, 1.4876068830490112, 1.6385626792907715, 1.7895183563232422, 1.940474033355713, 2.0914297103881836, 2.2423856258392334, 2.393341302871704, 2.544296979904175, 2.6952528953552246, 2.8462085723876953, 2.997164249420166, 3.1481199264526367, 3.2990756034851074, 3.4500315189361572, 3.600987195968628, 3.7519428730010986, 3.9028987884521484, 4.053854465484619, 4.20481014251709]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 12.0, 12.0, 20.0, 29.0, 61.0, 94.0, 255.0, 620.0, 1960.0, 8109.0, 62913.0, 765802.0, 186674.0, 17032.0, 3288.0, 994.0, 360.0, 149.0, 55.0, 41.0, 21.0, 18.0, 13.0, 6.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.05859375, -4.869140625, -4.6796875, -4.490234375, -4.30078125, -4.111328125, -3.921875, -3.732421875, -3.54296875, -3.353515625, -3.1640625, -2.974609375, -2.78515625, -2.595703125, -2.40625, -2.216796875, -2.02734375, -1.837890625, -1.6484375, -1.458984375, -1.26953125, -1.080078125, -0.890625, -0.701171875, -0.51171875, -0.322265625, -0.1328125, 0.056640625, 0.24609375, 0.435546875, 0.625, 0.814453125, 1.00390625, 1.193359375, 1.3828125, 1.572265625, 1.76171875, 1.951171875, 2.140625, 2.330078125, 2.51953125, 2.708984375, 2.8984375, 3.087890625, 3.27734375, 3.466796875, 3.65625, 3.845703125, 4.03515625, 4.224609375, 4.4140625, 4.603515625, 4.79296875, 4.982421875, 5.171875, 5.361328125, 5.55078125, 5.740234375, 5.9296875, 6.119140625, 6.30859375, 6.498046875, 6.6875, 6.876953125, 7.06640625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 14.0, 12.0, 21.0, 31.0, 52.0, 65.0, 66.0, 66.0, 79.0, 82.0, 70.0, 74.0, 82.0, 64.0, 51.0, 40.0, 43.0, 28.0, 23.0, 13.0, 4.0, 8.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91796875, -0.879852294921875, -0.84173583984375, -0.803619384765625, -0.7655029296875, -0.727386474609375, -0.68927001953125, -0.651153564453125, -0.613037109375, -0.574920654296875, -0.53680419921875, -0.498687744140625, -0.4605712890625, -0.422454833984375, -0.38433837890625, -0.346221923828125, -0.30810546875, -0.269989013671875, -0.23187255859375, -0.193756103515625, -0.1556396484375, -0.117523193359375, -0.07940673828125, -0.041290283203125, -0.003173828125, 0.034942626953125, 0.07305908203125, 0.111175537109375, 0.1492919921875, 0.187408447265625, 0.22552490234375, 0.263641357421875, 0.3017578125, 0.339874267578125, 0.37799072265625, 0.416107177734375, 0.4542236328125, 0.492340087890625, 0.53045654296875, 0.568572998046875, 0.606689453125, 0.644805908203125, 0.68292236328125, 0.721038818359375, 0.7591552734375, 0.797271728515625, 0.83538818359375, 0.873504638671875, 0.91162109375, 0.949737548828125, 0.98785400390625, 1.025970458984375, 1.0640869140625, 1.102203369140625, 1.14031982421875, 1.178436279296875, 1.216552734375, 1.254669189453125, 1.29278564453125, 1.330902099609375, 1.3690185546875, 1.407135009765625, 1.44525146484375, 1.483367919921875, 1.521484375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 4.0, 2.0, 6.0, 5.0, 12.0, 15.0, 14.0, 20.0, 40.0, 61.0, 122.0, 186.0, 287.0, 528.0, 1029.0, 2229.0, 6030.0, 23284.0, 133674.0, 671606.0, 169506.0, 27740.0, 7111.0, 2568.0, 1135.0, 582.0, 327.0, 159.0, 91.0, 52.0, 41.0, 23.0, 16.0, 10.0, 11.0, 4.0, 5.0, 8.0, 5.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.697265625, -3.580108642578125, -3.46295166015625, -3.345794677734375, -3.2286376953125, -3.111480712890625, -2.99432373046875, -2.877166748046875, -2.760009765625, -2.642852783203125, -2.52569580078125, -2.408538818359375, -2.2913818359375, -2.174224853515625, -2.05706787109375, -1.939910888671875, -1.82275390625, -1.705596923828125, -1.58843994140625, -1.471282958984375, -1.3541259765625, -1.236968994140625, -1.11981201171875, -1.002655029296875, -0.885498046875, -0.768341064453125, -0.65118408203125, -0.534027099609375, -0.4168701171875, -0.299713134765625, -0.18255615234375, -0.065399169921875, 0.0517578125, 0.168914794921875, 0.28607177734375, 0.403228759765625, 0.5203857421875, 0.637542724609375, 0.75469970703125, 0.871856689453125, 0.989013671875, 1.106170654296875, 1.22332763671875, 1.340484619140625, 1.4576416015625, 1.574798583984375, 1.69195556640625, 1.809112548828125, 1.92626953125, 2.043426513671875, 2.16058349609375, 2.277740478515625, 2.3948974609375, 2.512054443359375, 2.62921142578125, 2.746368408203125, 2.863525390625, 2.980682373046875, 3.09783935546875, 3.214996337890625, 3.3321533203125, 3.449310302734375, 3.56646728515625, 3.683624267578125, 3.80078125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 0.0, 7.0, 6.0, 7.0, 3.0, 8.0, 10.0, 5.0, 13.0, 20.0, 13.0, 22.0, 26.0, 27.0, 24.0, 22.0, 38.0, 33.0, 30.0, 33.0, 40.0, 36.0, 31.0, 46.0, 45.0, 42.0, 52.0, 44.0, 33.0, 35.0, 46.0, 23.0, 25.0, 16.0, 23.0, 15.0, 12.0, 20.0, 15.0, 15.0, 8.0, 11.0, 3.0, 6.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-2.84375, -2.756500244140625, -2.66925048828125, -2.582000732421875, -2.4947509765625, -2.407501220703125, -2.32025146484375, -2.233001708984375, -2.145751953125, -2.058502197265625, -1.97125244140625, -1.884002685546875, -1.7967529296875, -1.709503173828125, -1.62225341796875, -1.535003662109375, -1.44775390625, -1.360504150390625, -1.27325439453125, -1.186004638671875, -1.0987548828125, -1.011505126953125, -0.92425537109375, -0.837005615234375, -0.749755859375, -0.662506103515625, -0.57525634765625, -0.488006591796875, -0.4007568359375, -0.313507080078125, -0.22625732421875, -0.139007568359375, -0.0517578125, 0.035491943359375, 0.12274169921875, 0.209991455078125, 0.2972412109375, 0.384490966796875, 0.47174072265625, 0.558990478515625, 0.646240234375, 0.733489990234375, 0.82073974609375, 0.907989501953125, 0.9952392578125, 1.082489013671875, 1.16973876953125, 1.256988525390625, 1.34423828125, 1.431488037109375, 1.51873779296875, 1.605987548828125, 1.6932373046875, 1.780487060546875, 1.86773681640625, 1.954986572265625, 2.042236328125, 2.129486083984375, 2.21673583984375, 2.303985595703125, 2.3912353515625, 2.478485107421875, 2.56573486328125, 2.652984619140625, 2.740234375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 4.0, 12.0, 17.0, 35.0, 53.0, 86.0, 168.0, 375.0, 1002.0, 3215.0, 15691.0, 404390.0, 598907.0, 18978.0, 3659.0, 1119.0, 421.0, 205.0, 91.0, 57.0, 25.0, 22.0, 10.0, 7.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.529296875, -2.439117431640625, -2.34893798828125, -2.258758544921875, -2.1685791015625, -2.078399658203125, -1.98822021484375, -1.898040771484375, -1.807861328125, -1.717681884765625, -1.62750244140625, -1.537322998046875, -1.4471435546875, -1.356964111328125, -1.26678466796875, -1.176605224609375, -1.08642578125, -0.996246337890625, -0.90606689453125, -0.815887451171875, -0.7257080078125, -0.635528564453125, -0.54534912109375, -0.455169677734375, -0.364990234375, -0.274810791015625, -0.18463134765625, -0.094451904296875, -0.0042724609375, 0.085906982421875, 0.17608642578125, 0.266265869140625, 0.3564453125, 0.446624755859375, 0.53680419921875, 0.626983642578125, 0.7171630859375, 0.807342529296875, 0.89752197265625, 0.987701416015625, 1.077880859375, 1.168060302734375, 1.25823974609375, 1.348419189453125, 1.4385986328125, 1.528778076171875, 1.61895751953125, 1.709136962890625, 1.79931640625, 1.889495849609375, 1.97967529296875, 2.069854736328125, 2.1600341796875, 2.250213623046875, 2.34039306640625, 2.430572509765625, 2.520751953125, 2.610931396484375, 2.70111083984375, 2.791290283203125, 2.8814697265625, 2.971649169921875, 3.06182861328125, 3.152008056640625, 3.2421875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 10.0, 15.0, 16.0, 23.0, 44.0, 69.0, 172.0, 253.0, 177.0, 95.0, 48.0, 34.0, 15.0, 19.0, 7.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00036334991455078125, -0.0003485828638076782, -0.0003338158130645752, -0.00031904876232147217, -0.00030428171157836914, -0.0002895146608352661, -0.0002747476100921631, -0.00025998055934906006, -0.00024521350860595703, -0.000230446457862854, -0.00021567940711975098, -0.00020091235637664795, -0.00018614530563354492, -0.0001713782548904419, -0.00015661120414733887, -0.00014184415340423584, -0.0001270771026611328, -0.00011231005191802979, -9.754300117492676e-05, -8.277595043182373e-05, -6.80088996887207e-05, -5.3241848945617676e-05, -3.847479820251465e-05, -2.370774745941162e-05, -8.940696716308594e-06, 5.826354026794434e-06, 2.059340476989746e-05, 3.536045551300049e-05, 5.0127506256103516e-05, 6.489455699920654e-05, 7.966160774230957e-05, 9.44286584854126e-05, 0.00010919570922851562, 0.00012396275997161865, 0.00013872981071472168, 0.0001534968614578247, 0.00016826391220092773, 0.00018303096294403076, 0.0001977980136871338, 0.00021256506443023682, 0.00022733211517333984, 0.00024209916591644287, 0.0002568662166595459, 0.0002716332674026489, 0.00028640031814575195, 0.000301167368888855, 0.000315934419631958, 0.00033070147037506104, 0.00034546852111816406, 0.0003602355718612671, 0.0003750026226043701, 0.00038976967334747314, 0.00040453672409057617, 0.0004193037748336792, 0.0004340708255767822, 0.00044883787631988525, 0.0004636049270629883, 0.0004783719778060913, 0.0004931390285491943, 0.0005079060792922974, 0.0005226731300354004, 0.0005374401807785034, 0.0005522072315216064, 0.0005669742822647095, 0.0005817413330078125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 5.0, 7.0, 11.0, 12.0, 21.0, 25.0, 45.0, 95.0, 178.0, 366.0, 992.0, 3523.0, 27204.0, 879689.0, 125965.0, 7723.0, 1605.0, 568.0, 248.0, 120.0, 54.0, 36.0, 18.0, 17.0, 8.0, 7.0, 6.0, 7.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.986328125, -2.889129638671875, -2.79193115234375, -2.694732666015625, -2.5975341796875, -2.500335693359375, -2.40313720703125, -2.305938720703125, -2.208740234375, -2.111541748046875, -2.01434326171875, -1.917144775390625, -1.8199462890625, -1.722747802734375, -1.62554931640625, -1.528350830078125, -1.43115234375, -1.333953857421875, -1.23675537109375, -1.139556884765625, -1.0423583984375, -0.945159912109375, -0.84796142578125, -0.750762939453125, -0.653564453125, -0.556365966796875, -0.45916748046875, -0.361968994140625, -0.2647705078125, -0.167572021484375, -0.07037353515625, 0.026824951171875, 0.1240234375, 0.221221923828125, 0.31842041015625, 0.415618896484375, 0.5128173828125, 0.610015869140625, 0.70721435546875, 0.804412841796875, 0.901611328125, 0.998809814453125, 1.09600830078125, 1.193206787109375, 1.2904052734375, 1.387603759765625, 1.48480224609375, 1.582000732421875, 1.67919921875, 1.776397705078125, 1.87359619140625, 1.970794677734375, 2.0679931640625, 2.165191650390625, 2.26239013671875, 2.359588623046875, 2.456787109375, 2.553985595703125, 2.65118408203125, 2.748382568359375, 2.8455810546875, 2.942779541015625, 3.03997802734375, 3.137176513671875, 3.234375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 9.0, 6.0, 11.0, 13.0, 13.0, 24.0, 36.0, 48.0, 66.0, 131.0, 152.0, 163.0, 121.0, 76.0, 48.0, 24.0, 22.0, 12.0, 8.0, 3.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.658203125, -1.60296630859375, -1.5477294921875, -1.49249267578125, -1.437255859375, -1.38201904296875, -1.3267822265625, -1.27154541015625, -1.21630859375, -1.16107177734375, -1.1058349609375, -1.05059814453125, -0.995361328125, -0.94012451171875, -0.8848876953125, -0.82965087890625, -0.7744140625, -0.71917724609375, -0.6639404296875, -0.60870361328125, -0.553466796875, -0.49822998046875, -0.4429931640625, -0.38775634765625, -0.33251953125, -0.27728271484375, -0.2220458984375, -0.16680908203125, -0.111572265625, -0.05633544921875, -0.0010986328125, 0.05413818359375, 0.109375, 0.16461181640625, 0.2198486328125, 0.27508544921875, 0.330322265625, 0.38555908203125, 0.4407958984375, 0.49603271484375, 0.55126953125, 0.60650634765625, 0.6617431640625, 0.71697998046875, 0.772216796875, 0.82745361328125, 0.8826904296875, 0.93792724609375, 0.9931640625, 1.04840087890625, 1.1036376953125, 1.15887451171875, 1.214111328125, 1.26934814453125, 1.3245849609375, 1.37982177734375, 1.43505859375, 1.49029541015625, 1.5455322265625, 1.60076904296875, 1.656005859375, 1.71124267578125, 1.7664794921875, 1.82171630859375, 1.876953125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 9.0, 16.0, 29.0, 41.0, 73.0, 97.0, 157.0, 186.0, 139.0, 105.0, 79.0, 35.0, 13.0, 10.0, 4.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.362564086914062, -19.562904357910156, -18.76324462890625, -17.963586807250977, -17.16392707824707, -16.364267349243164, -15.564608573913574, -14.764949798583984, -13.965290069580078, -13.165630340576172, -12.365971565246582, -11.566312789916992, -10.766653060913086, -9.96699333190918, -9.16733455657959, -8.36767578125, -7.568016052246094, -6.768356800079346, -5.968697547912598, -5.16903829574585, -4.369379043579102, -3.5697197914123535, -2.7700605392456055, -1.9704012870788574, -1.1707420349121094, -0.37108278274536133, 0.4285764694213867, 1.2282357215881348, 2.027894973754883, 2.827554225921631, 3.627213478088379, 4.426872730255127, 5.226533889770508, 6.026193141937256, 6.825852394104004, 7.625511646270752, 8.4251708984375, 9.224830627441406, 10.024489402770996, 10.824148178100586, 11.623807907104492, 12.423467636108398, 13.223126411437988, 14.022785186767578, 14.822444915771484, 15.62210464477539, 16.421764373779297, 17.22142219543457, 18.021081924438477, 18.820741653442383, 19.620399475097656, 20.420059204101562, 21.21971893310547, 22.019378662109375, 22.81903839111328, 23.618696212768555, 24.41835594177246, 25.218015670776367, 26.01767349243164, 26.817333221435547, 27.616992950439453, 28.41665267944336, 29.216312408447266, 30.01597023010254, 30.815629959106445]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 3.0, 5.0, 7.0, 6.0, 3.0, 14.0, 13.0, 19.0, 23.0, 21.0, 30.0, 24.0, 27.0, 36.0, 24.0, 37.0, 45.0, 41.0, 42.0, 43.0, 57.0, 45.0, 43.0, 43.0, 46.0, 38.0, 32.0, 35.0, 35.0, 28.0, 28.0, 21.0, 22.0, 18.0, 9.0, 10.0, 5.0, 10.0, 4.0, 7.0, 2.0, 4.0, 4.0, 1.0], "bins": [-19.779029846191406, -19.29183006286621, -18.80463218688965, -18.317432403564453, -17.830232620239258, -17.343032836914062, -16.8558349609375, -16.368635177612305, -15.881436347961426, -15.394237518310547, -14.907037734985352, -14.419838905334473, -13.932640075683594, -13.445440292358398, -12.95824146270752, -12.47104263305664, -11.983842849731445, -11.496644020080566, -11.009444236755371, -10.522245407104492, -10.035045623779297, -9.547846794128418, -9.060647964477539, -8.573448181152344, -8.086249351501465, -7.599050045013428, -7.111850738525391, -6.624651908874512, -6.137452602386475, -5.6502532958984375, -5.163054466247559, -4.6758551597595215, -4.188655853271484, -3.7014565467834473, -3.2142574787139893, -2.7270584106445312, -2.239859104156494, -1.752659797668457, -1.265460729598999, -0.778261661529541, -0.2910623550415039, 0.19613683223724365, 0.6833360195159912, 1.1705352067947388, 1.6577343940734863, 2.1449337005615234, 2.6321327686309814, 3.1193318367004395, 3.6065311431884766, 4.093730449676514, 4.580929756164551, 5.06812858581543, 5.555327892303467, 6.042527198791504, 6.529726028442383, 7.01692533493042, 7.504124641418457, 7.991323947906494, 8.478523254394531, 8.96572208404541, 9.452920913696289, 9.940120697021484, 10.427319526672363, 10.914518356323242, 11.401718139648438]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 8.0, 5.0, 12.0, 20.0, 27.0, 24.0, 62.0, 81.0, 145.0, 243.0, 404.0, 722.0, 1270.0, 2757.0, 6271.0, 16429.0, 62939.0, 3928942.0, 132884.0, 24876.0, 8551.0, 3725.0, 1845.0, 850.0, 516.0, 261.0, 136.0, 83.0, 41.0, 31.0, 20.0, 21.0, 15.0, 12.0, 10.0, 4.0, 5.0, 7.0, 4.0, 5.0, 5.0, 3.0, 1.0, 2.0, 3.0, 1.0, 7.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.46875, -3.3087158203125, -3.148681640625, -2.9886474609375, -2.82861328125, -2.6685791015625, -2.508544921875, -2.3485107421875, -2.1884765625, -2.0284423828125, -1.868408203125, -1.7083740234375, -1.54833984375, -1.3883056640625, -1.228271484375, -1.0682373046875, -0.908203125, -0.7481689453125, -0.588134765625, -0.4281005859375, -0.26806640625, -0.1080322265625, 0.052001953125, 0.2120361328125, 0.3720703125, 0.5321044921875, 0.692138671875, 0.8521728515625, 1.01220703125, 1.1722412109375, 1.332275390625, 1.4923095703125, 1.65234375, 1.8123779296875, 1.972412109375, 2.1324462890625, 2.29248046875, 2.4525146484375, 2.612548828125, 2.7725830078125, 2.9326171875, 3.0926513671875, 3.252685546875, 3.4127197265625, 3.57275390625, 3.7327880859375, 3.892822265625, 4.0528564453125, 4.212890625, 4.3729248046875, 4.532958984375, 4.6929931640625, 4.85302734375, 5.0130615234375, 5.173095703125, 5.3331298828125, 5.4931640625, 5.6531982421875, 5.813232421875, 5.9732666015625, 6.13330078125, 6.2933349609375, 6.453369140625, 6.6134033203125, 6.7734375]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 7.0, 6.0, 12.0, 19.0, 23.0, 34.0, 44.0, 51.0, 60.0, 72.0, 86.0, 81.0, 74.0, 74.0, 64.0, 61.0, 66.0, 40.0, 30.0, 29.0, 25.0, 15.0, 11.0, 9.0, 4.0, 7.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.27734375, -1.2376708984375, -1.197998046875, -1.1583251953125, -1.11865234375, -1.0789794921875, -1.039306640625, -0.9996337890625, -0.9599609375, -0.9202880859375, -0.880615234375, -0.8409423828125, -0.80126953125, -0.7615966796875, -0.721923828125, -0.6822509765625, -0.642578125, -0.6029052734375, -0.563232421875, -0.5235595703125, -0.48388671875, -0.4442138671875, -0.404541015625, -0.3648681640625, -0.3251953125, -0.2855224609375, -0.245849609375, -0.2061767578125, -0.16650390625, -0.1268310546875, -0.087158203125, -0.0474853515625, -0.0078125, 0.0318603515625, 0.071533203125, 0.1112060546875, 0.15087890625, 0.1905517578125, 0.230224609375, 0.2698974609375, 0.3095703125, 0.3492431640625, 0.388916015625, 0.4285888671875, 0.46826171875, 0.5079345703125, 0.547607421875, 0.5872802734375, 0.626953125, 0.6666259765625, 0.706298828125, 0.7459716796875, 0.78564453125, 0.8253173828125, 0.864990234375, 0.9046630859375, 0.9443359375, 0.9840087890625, 1.023681640625, 1.0633544921875, 1.10302734375, 1.1427001953125, 1.182373046875, 1.2220458984375, 1.26171875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 5.0, 15.0, 17.0, 22.0, 30.0, 32.0, 64.0, 106.0, 117.0, 174.0, 280.0, 506.0, 854.0, 1579.0, 3129.0, 7122.0, 20382.0, 103587.0, 3910521.0, 110431.0, 21171.0, 7308.0, 3003.0, 1548.0, 842.0, 491.0, 306.0, 203.0, 144.0, 72.0, 68.0, 57.0, 31.0, 18.0, 9.0, 11.0, 7.0, 5.0, 6.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5625, -4.417724609375, -4.27294921875, -4.128173828125, -3.9833984375, -3.838623046875, -3.69384765625, -3.549072265625, -3.404296875, -3.259521484375, -3.11474609375, -2.969970703125, -2.8251953125, -2.680419921875, -2.53564453125, -2.390869140625, -2.24609375, -2.101318359375, -1.95654296875, -1.811767578125, -1.6669921875, -1.522216796875, -1.37744140625, -1.232666015625, -1.087890625, -0.943115234375, -0.79833984375, -0.653564453125, -0.5087890625, -0.364013671875, -0.21923828125, -0.074462890625, 0.0703125, 0.215087890625, 0.35986328125, 0.504638671875, 0.6494140625, 0.794189453125, 0.93896484375, 1.083740234375, 1.228515625, 1.373291015625, 1.51806640625, 1.662841796875, 1.8076171875, 1.952392578125, 2.09716796875, 2.241943359375, 2.38671875, 2.531494140625, 2.67626953125, 2.821044921875, 2.9658203125, 3.110595703125, 3.25537109375, 3.400146484375, 3.544921875, 3.689697265625, 3.83447265625, 3.979248046875, 4.1240234375, 4.268798828125, 4.41357421875, 4.558349609375, 4.703125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 3.0, 7.0, 13.0, 14.0, 18.0, 21.0, 42.0, 68.0, 168.0, 2679.0, 712.0, 144.0, 45.0, 40.0, 22.0, 17.0, 18.0, 5.0, 8.0, 3.0, 4.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6767578125, -1.6186676025390625, -1.560577392578125, -1.5024871826171875, -1.44439697265625, -1.3863067626953125, -1.328216552734375, -1.2701263427734375, -1.2120361328125, -1.1539459228515625, -1.095855712890625, -1.0377655029296875, -0.97967529296875, -0.9215850830078125, -0.863494873046875, -0.8054046630859375, -0.747314453125, -0.6892242431640625, -0.631134033203125, -0.5730438232421875, -0.51495361328125, -0.4568634033203125, -0.398773193359375, -0.3406829833984375, -0.2825927734375, -0.2245025634765625, -0.166412353515625, -0.1083221435546875, -0.05023193359375, 0.0078582763671875, 0.065948486328125, 0.1240386962890625, 0.18212890625, 0.2402191162109375, 0.298309326171875, 0.3563995361328125, 0.41448974609375, 0.4725799560546875, 0.530670166015625, 0.5887603759765625, 0.6468505859375, 0.7049407958984375, 0.763031005859375, 0.8211212158203125, 0.87921142578125, 0.9373016357421875, 0.995391845703125, 1.0534820556640625, 1.111572265625, 1.1696624755859375, 1.227752685546875, 1.2858428955078125, 1.34393310546875, 1.4020233154296875, 1.460113525390625, 1.5182037353515625, 1.5762939453125, 1.6343841552734375, 1.692474365234375, 1.7505645751953125, 1.80865478515625, 1.8667449951171875, 1.924835205078125, 1.9829254150390625, 2.041015625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 26.0, 28.0, 52.0, 137.0, 232.0, 248.0, 134.0, 64.0, 28.0, 18.0, 12.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.277240753173828, -9.908409118652344, -9.53957748413086, -9.170746803283691, -8.801915168762207, -8.433083534240723, -8.064252853393555, -7.69542121887207, -7.326589584350586, -6.957757949829102, -6.588926792144775, -6.220095634460449, -5.851263999938965, -5.4824323654174805, -5.113601207733154, -4.744770050048828, -4.375938415527344, -4.007106781005859, -3.638275623321533, -3.269444227218628, -2.9006128311157227, -2.5317814350128174, -2.162950038909912, -1.7941186428070068, -1.4252872467041016, -1.0564558506011963, -0.687624454498291, -0.31879305839538574, 0.05003833770751953, 0.4188697338104248, 0.7877011299133301, 1.1565325260162354, 1.5253629684448242, 1.8941943645477295, 2.2630257606506348, 2.63185715675354, 3.0006885528564453, 3.3695199489593506, 3.738351345062256, 4.107182502746582, 4.476014137268066, 4.844845771789551, 5.213676929473877, 5.582508087158203, 5.9513397216796875, 6.320171356201172, 6.689002513885498, 7.057833671569824, 7.426665306091309, 7.795496940612793, 8.164327621459961, 8.533159255981445, 8.90199089050293, 9.270822525024414, 9.639654159545898, 10.008484840393066, 10.37731647491455, 10.746148109436035, 11.114978790283203, 11.483810424804688, 11.852642059326172, 12.221473693847656, 12.59030532836914, 12.959136009216309, 13.327967643737793]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 5.0, 10.0, 4.0, 14.0, 21.0, 31.0, 22.0, 30.0, 34.0, 39.0, 49.0, 54.0, 78.0, 57.0, 53.0, 54.0, 58.0, 51.0, 58.0, 54.0, 41.0, 33.0, 31.0, 31.0, 23.0, 21.0, 12.0, 10.0, 5.0, 10.0, 1.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.140196323394775, -4.968681812286377, -4.79716682434082, -4.625652313232422, -4.454137802124023, -4.282622814178467, -4.111108303070068, -3.939593553543091, -3.7680788040161133, -3.5965640544891357, -3.425049304962158, -3.2535347938537598, -3.0820200443267822, -2.9105052947998047, -2.7389907836914062, -2.5674760341644287, -2.395961284637451, -2.2244465351104736, -2.052931785583496, -1.8814172744750977, -1.7099025249481201, -1.5383877754211426, -1.3668731451034546, -1.1953585147857666, -1.023843765258789, -0.8523290753364563, -0.6808143854141235, -0.5092996954917908, -0.337785005569458, -0.16627031564712524, 0.0052443742752075195, 0.1767590045928955, 0.34827423095703125, 0.519788920879364, 0.6913036108016968, 0.8628183007240295, 1.0343329906463623, 1.2058477401733398, 1.3773623704910278, 1.5488770008087158, 1.7203917503356934, 1.891906499862671, 2.0634212493896484, 2.234935760498047, 2.4064505100250244, 2.577965259552002, 2.7494797706604004, 2.920994520187378, 3.0925092697143555, 3.264024019241333, 3.4355387687683105, 3.607053279876709, 3.7785680294036865, 3.950082778930664, 4.1215972900390625, 4.293111801147461, 4.464626789093018, 4.636141300201416, 4.807656288146973, 4.979170799255371, 5.1506853103637695, 5.322200298309326, 5.493714809417725, 5.665229797363281, 5.83674430847168]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 8.0, 1.0, 5.0, 6.0, 6.0, 5.0, 12.0, 21.0, 27.0, 51.0, 72.0, 154.0, 277.0, 636.0, 1342.0, 3591.0, 10640.0, 38888.0, 177852.0, 581622.0, 177391.0, 39100.0, 10657.0, 3655.0, 1344.0, 545.0, 261.0, 143.0, 84.0, 61.0, 26.0, 19.0, 10.0, 14.0, 8.0, 9.0, 4.0, 6.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-4.515625, -4.39190673828125, -4.2681884765625, -4.14447021484375, -4.020751953125, -3.89703369140625, -3.7733154296875, -3.64959716796875, -3.52587890625, -3.40216064453125, -3.2784423828125, -3.15472412109375, -3.031005859375, -2.90728759765625, -2.7835693359375, -2.65985107421875, -2.5361328125, -2.41241455078125, -2.2886962890625, -2.16497802734375, -2.041259765625, -1.91754150390625, -1.7938232421875, -1.67010498046875, -1.54638671875, -1.42266845703125, -1.2989501953125, -1.17523193359375, -1.051513671875, -0.92779541015625, -0.8040771484375, -0.68035888671875, -0.556640625, -0.43292236328125, -0.3092041015625, -0.18548583984375, -0.061767578125, 0.06195068359375, 0.1856689453125, 0.30938720703125, 0.43310546875, 0.55682373046875, 0.6805419921875, 0.80426025390625, 0.927978515625, 1.05169677734375, 1.1754150390625, 1.29913330078125, 1.4228515625, 1.54656982421875, 1.6702880859375, 1.79400634765625, 1.917724609375, 2.04144287109375, 2.1651611328125, 2.28887939453125, 2.41259765625, 2.53631591796875, 2.6600341796875, 2.78375244140625, 2.907470703125, 3.03118896484375, 3.1549072265625, 3.27862548828125, 3.40234375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 10.0, 15.0, 21.0, 14.0, 22.0, 36.0, 40.0, 42.0, 60.0, 60.0, 82.0, 76.0, 75.0, 68.0, 66.0, 56.0, 36.0, 39.0, 34.0, 33.0, 30.0, 24.0, 14.0, 16.0, 10.0, 9.0, 6.0, 6.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0166015625, -0.98095703125, -0.9453125, -0.90966796875, -0.8740234375, -0.83837890625, -0.802734375, -0.76708984375, -0.7314453125, -0.69580078125, -0.66015625, -0.62451171875, -0.5888671875, -0.55322265625, -0.517578125, -0.48193359375, -0.4462890625, -0.41064453125, -0.375, -0.33935546875, -0.3037109375, -0.26806640625, -0.232421875, -0.19677734375, -0.1611328125, -0.12548828125, -0.08984375, -0.05419921875, -0.0185546875, 0.01708984375, 0.052734375, 0.08837890625, 0.1240234375, 0.15966796875, 0.1953125, 0.23095703125, 0.2666015625, 0.30224609375, 0.337890625, 0.37353515625, 0.4091796875, 0.44482421875, 0.48046875, 0.51611328125, 0.5517578125, 0.58740234375, 0.623046875, 0.65869140625, 0.6943359375, 0.72998046875, 0.765625, 0.80126953125, 0.8369140625, 0.87255859375, 0.908203125, 0.94384765625, 0.9794921875, 1.01513671875, 1.05078125, 1.08642578125, 1.1220703125, 1.15771484375, 1.193359375, 1.22900390625, 1.2646484375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 8.0, 9.0, 7.0, 9.0, 28.0, 34.0, 53.0, 75.0, 162.0, 246.0, 560.0, 1276.0, 4223.0, 16036.0, 74170.0, 433271.0, 423077.0, 72955.0, 15890.0, 4055.0, 1226.0, 533.0, 282.0, 146.0, 87.0, 54.0, 29.0, 21.0, 11.0, 12.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.40234375, -4.292266845703125, -4.18218994140625, -4.072113037109375, -3.9620361328125, -3.851959228515625, -3.74188232421875, -3.631805419921875, -3.521728515625, -3.411651611328125, -3.30157470703125, -3.191497802734375, -3.0814208984375, -2.971343994140625, -2.86126708984375, -2.751190185546875, -2.64111328125, -2.531036376953125, -2.42095947265625, -2.310882568359375, -2.2008056640625, -2.090728759765625, -1.98065185546875, -1.870574951171875, -1.760498046875, -1.650421142578125, -1.54034423828125, -1.430267333984375, -1.3201904296875, -1.210113525390625, -1.10003662109375, -0.989959716796875, -0.8798828125, -0.769805908203125, -0.65972900390625, -0.549652099609375, -0.4395751953125, -0.329498291015625, -0.21942138671875, -0.109344482421875, 0.000732421875, 0.110809326171875, 0.22088623046875, 0.330963134765625, 0.4410400390625, 0.551116943359375, 0.66119384765625, 0.771270751953125, 0.88134765625, 0.991424560546875, 1.10150146484375, 1.211578369140625, 1.3216552734375, 1.431732177734375, 1.54180908203125, 1.651885986328125, 1.761962890625, 1.872039794921875, 1.98211669921875, 2.092193603515625, 2.2022705078125, 2.312347412109375, 2.42242431640625, 2.532501220703125, 2.642578125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 8.0, 9.0, 7.0, 13.0, 28.0, 23.0, 24.0, 29.0, 28.0, 31.0, 49.0, 41.0, 47.0, 49.0, 47.0, 45.0, 44.0, 51.0, 56.0, 36.0, 32.0, 36.0, 33.0, 36.0, 34.0, 26.0, 23.0, 22.0, 14.0, 15.0, 14.0, 10.0, 9.0, 8.0, 7.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 3.0], "bins": [-4.38671875, -4.272979736328125, -4.15924072265625, -4.045501708984375, -3.9317626953125, -3.818023681640625, -3.70428466796875, -3.590545654296875, -3.476806640625, -3.363067626953125, -3.24932861328125, -3.135589599609375, -3.0218505859375, -2.908111572265625, -2.79437255859375, -2.680633544921875, -2.56689453125, -2.453155517578125, -2.33941650390625, -2.225677490234375, -2.1119384765625, -1.998199462890625, -1.88446044921875, -1.770721435546875, -1.656982421875, -1.543243408203125, -1.42950439453125, -1.315765380859375, -1.2020263671875, -1.088287353515625, -0.97454833984375, -0.860809326171875, -0.7470703125, -0.633331298828125, -0.51959228515625, -0.405853271484375, -0.2921142578125, -0.178375244140625, -0.06463623046875, 0.049102783203125, 0.162841796875, 0.276580810546875, 0.39031982421875, 0.504058837890625, 0.6177978515625, 0.731536865234375, 0.84527587890625, 0.959014892578125, 1.07275390625, 1.186492919921875, 1.30023193359375, 1.413970947265625, 1.5277099609375, 1.641448974609375, 1.75518798828125, 1.868927001953125, 1.982666015625, 2.096405029296875, 2.21014404296875, 2.323883056640625, 2.4376220703125, 2.551361083984375, 2.66510009765625, 2.778839111328125, 2.892578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 7.0, 15.0, 31.0, 29.0, 85.0, 138.0, 341.0, 708.0, 1685.0, 4825.0, 19883.0, 199518.0, 743370.0, 62684.0, 10224.0, 2891.0, 1154.0, 473.0, 201.0, 124.0, 69.0, 27.0, 16.0, 17.0, 9.0, 4.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.71484375, -2.6457366943359375, -2.576629638671875, -2.5075225830078125, -2.43841552734375, -2.3693084716796875, -2.300201416015625, -2.2310943603515625, -2.1619873046875, -2.0928802490234375, -2.023773193359375, -1.9546661376953125, -1.88555908203125, -1.8164520263671875, -1.747344970703125, -1.6782379150390625, -1.609130859375, -1.5400238037109375, -1.470916748046875, -1.4018096923828125, -1.33270263671875, -1.2635955810546875, -1.194488525390625, -1.1253814697265625, -1.0562744140625, -0.9871673583984375, -0.918060302734375, -0.8489532470703125, -0.77984619140625, -0.7107391357421875, -0.641632080078125, -0.5725250244140625, -0.50341796875, -0.4343109130859375, -0.365203857421875, -0.2960968017578125, -0.22698974609375, -0.1578826904296875, -0.088775634765625, -0.0196685791015625, 0.0494384765625, 0.1185455322265625, 0.187652587890625, 0.2567596435546875, 0.32586669921875, 0.3949737548828125, 0.464080810546875, 0.5331878662109375, 0.602294921875, 0.6714019775390625, 0.740509033203125, 0.8096160888671875, 0.87872314453125, 0.9478302001953125, 1.016937255859375, 1.0860443115234375, 1.1551513671875, 1.2242584228515625, 1.293365478515625, 1.3624725341796875, 1.43157958984375, 1.5006866455078125, 1.569793701171875, 1.6389007568359375, 1.7080078125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 6.0, 6.0, 11.0, 5.0, 9.0, 16.0, 23.0, 37.0, 55.0, 49.0, 133.0, 148.0, 147.0, 104.0, 63.0, 60.0, 31.0, 13.0, 20.0, 16.0, 16.0, 9.0, 5.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002944469451904297, -0.00028603896498680115, -0.0002776309847831726, -0.00026922300457954407, -0.00026081502437591553, -0.000252407044172287, -0.00024399906396865845, -0.0002355910837650299, -0.00022718310356140137, -0.00021877512335777283, -0.0002103671431541443, -0.00020195916295051575, -0.0001935511827468872, -0.00018514320254325867, -0.00017673522233963013, -0.0001683272421360016, -0.00015991926193237305, -0.0001515112817287445, -0.00014310330152511597, -0.00013469532132148743, -0.0001262873411178589, -0.00011787936091423035, -0.0001094713807106018, -0.00010106340050697327, -9.265542030334473e-05, -8.424744009971619e-05, -7.583945989608765e-05, -6.74314796924591e-05, -5.9023499488830566e-05, -5.0615519285202026e-05, -4.2207539081573486e-05, -3.3799558877944946e-05, -2.5391578674316406e-05, -1.6983598470687866e-05, -8.575618267059326e-06, -1.6763806343078613e-07, 8.240342140197754e-06, 1.6648322343826294e-05, 2.5056302547454834e-05, 3.3464282751083374e-05, 4.1872262954711914e-05, 5.0280243158340454e-05, 5.8688223361968994e-05, 6.709620356559753e-05, 7.550418376922607e-05, 8.391216397285461e-05, 9.232014417648315e-05, 0.0001007281243801117, 0.00010913610458374023, 0.00011754408478736877, 0.00012595206499099731, 0.00013436004519462585, 0.0001427680253982544, 0.00015117600560188293, 0.00015958398580551147, 0.00016799196600914001, 0.00017639994621276855, 0.0001848079264163971, 0.00019321590662002563, 0.00020162388682365417, 0.00021003186702728271, 0.00021843984723091125, 0.0002268478274345398, 0.00023525580763816833, 0.00024366378784179688]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 7.0, 17.0, 13.0, 13.0, 19.0, 32.0, 46.0, 78.0, 112.0, 207.0, 357.0, 744.0, 1602.0, 4528.0, 16832.0, 108477.0, 739067.0, 147364.0, 20445.0, 5092.0, 1821.0, 698.0, 394.0, 213.0, 157.0, 86.0, 40.0, 36.0, 14.0, 16.0, 7.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.447265625, -2.378448486328125, -2.30963134765625, -2.240814208984375, -2.1719970703125, -2.103179931640625, -2.03436279296875, -1.965545654296875, -1.896728515625, -1.827911376953125, -1.75909423828125, -1.690277099609375, -1.6214599609375, -1.552642822265625, -1.48382568359375, -1.415008544921875, -1.34619140625, -1.277374267578125, -1.20855712890625, -1.139739990234375, -1.0709228515625, -1.002105712890625, -0.93328857421875, -0.864471435546875, -0.795654296875, -0.726837158203125, -0.65802001953125, -0.589202880859375, -0.5203857421875, -0.451568603515625, -0.38275146484375, -0.313934326171875, -0.2451171875, -0.176300048828125, -0.10748291015625, -0.038665771484375, 0.0301513671875, 0.098968505859375, 0.16778564453125, 0.236602783203125, 0.305419921875, 0.374237060546875, 0.44305419921875, 0.511871337890625, 0.5806884765625, 0.649505615234375, 0.71832275390625, 0.787139892578125, 0.85595703125, 0.924774169921875, 0.99359130859375, 1.062408447265625, 1.1312255859375, 1.200042724609375, 1.26885986328125, 1.337677001953125, 1.406494140625, 1.475311279296875, 1.54412841796875, 1.612945556640625, 1.6817626953125, 1.750579833984375, 1.81939697265625, 1.888214111328125, 1.95703125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 10.0, 8.0, 14.0, 13.0, 25.0, 44.0, 65.0, 129.0, 175.0, 177.0, 129.0, 78.0, 56.0, 19.0, 16.0, 13.0, 8.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.22265625, -3.138214111328125, -3.05377197265625, -2.969329833984375, -2.8848876953125, -2.800445556640625, -2.71600341796875, -2.631561279296875, -2.547119140625, -2.462677001953125, -2.37823486328125, -2.293792724609375, -2.2093505859375, -2.124908447265625, -2.04046630859375, -1.956024169921875, -1.87158203125, -1.787139892578125, -1.70269775390625, -1.618255615234375, -1.5338134765625, -1.449371337890625, -1.36492919921875, -1.280487060546875, -1.196044921875, -1.111602783203125, -1.02716064453125, -0.942718505859375, -0.8582763671875, -0.773834228515625, -0.68939208984375, -0.604949951171875, -0.5205078125, -0.436065673828125, -0.35162353515625, -0.267181396484375, -0.1827392578125, -0.098297119140625, -0.01385498046875, 0.070587158203125, 0.155029296875, 0.239471435546875, 0.32391357421875, 0.408355712890625, 0.4927978515625, 0.577239990234375, 0.66168212890625, 0.746124267578125, 0.83056640625, 0.915008544921875, 0.99945068359375, 1.083892822265625, 1.1683349609375, 1.252777099609375, 1.33721923828125, 1.421661376953125, 1.506103515625, 1.590545654296875, 1.67498779296875, 1.759429931640625, 1.8438720703125, 1.928314208984375, 2.01275634765625, 2.097198486328125, 2.181640625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 18.0, 77.0, 266.0, 428.0, 165.0, 45.0, 10.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.16051483154297, -33.79642868041992, -31.432342529296875, -29.068256378173828, -26.70417022705078, -24.340084075927734, -21.975997924804688, -19.61191177368164, -17.247825622558594, -14.883739471435547, -12.5196533203125, -10.155567169189453, -7.791481018066406, -5.427394866943359, -3.0633087158203125, -0.6992225646972656, 1.6648635864257812, 4.028949737548828, 6.393035888671875, 8.757122039794922, 11.121208190917969, 13.485294342041016, 15.849380493164062, 18.21346664428711, 20.577552795410156, 22.941638946533203, 25.30572509765625, 27.669811248779297, 30.033897399902344, 32.39798355102539, 34.76206970214844, 37.126155853271484, 39.490234375, 41.85432052612305, 44.218406677246094, 46.58249282836914, 48.94657897949219, 51.310665130615234, 53.67475128173828, 56.03883743286133, 58.402923583984375, 60.76700973510742, 63.13109588623047, 65.49517822265625, 67.85926818847656, 70.22335815429688, 72.58744049072266, 74.95152282714844, 77.31561279296875, 79.67970275878906, 82.04378509521484, 84.40786743164062, 86.77195739746094, 89.13604736328125, 91.50012969970703, 93.86421203613281, 96.22830200195312, 98.59239196777344, 100.95647430419922, 103.320556640625, 105.68464660644531, 108.04873657226562, 110.4128189086914, 112.77690124511719, 115.1409912109375]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 6.0, 0.0, 5.0, 7.0, 9.0, 8.0, 16.0, 17.0, 22.0, 21.0, 28.0, 27.0, 26.0, 37.0, 24.0, 24.0, 37.0, 42.0, 30.0, 47.0, 36.0, 41.0, 43.0, 46.0, 35.0, 25.0, 28.0, 28.0, 33.0, 35.0, 21.0, 29.0, 23.0, 28.0, 22.0, 21.0, 11.0, 10.0, 11.0, 11.0, 7.0, 7.0, 4.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.09040641784668, -16.554485321044922, -16.018566131591797, -15.482645988464355, -14.946725845336914, -14.410805702209473, -13.874885559082031, -13.33896541595459, -12.803045272827148, -12.267125129699707, -11.731204986572266, -11.195284843444824, -10.659364700317383, -10.123444557189941, -9.5875244140625, -9.051604270935059, -8.515684127807617, -7.979763984680176, -7.443843841552734, -6.907923698425293, -6.372003555297852, -5.83608341217041, -5.300163269042969, -4.764243125915527, -4.228322982788086, -3.6924028396606445, -3.156482696533203, -2.6205625534057617, -2.0846424102783203, -1.548722267150879, -1.0128021240234375, -0.4768819808959961, 0.059040069580078125, 0.5949602127075195, 1.130880355834961, 1.6668004989624023, 2.2027206420898438, 2.738640785217285, 3.2745609283447266, 3.810481071472168, 4.346401214599609, 4.882321357727051, 5.418241500854492, 5.954161643981934, 6.490081787109375, 7.026001930236816, 7.561922073364258, 8.0978422164917, 8.63376235961914, 9.169682502746582, 9.705602645874023, 10.241522789001465, 10.777442932128906, 11.313363075256348, 11.849283218383789, 12.38520336151123, 12.921123504638672, 13.457043647766113, 13.992963790893555, 14.528883934020996, 15.064804077148438, 15.600724220275879, 16.13664436340332, 16.672565460205078, 17.208484649658203]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 4.0, 7.0, 21.0, 31.0, 56.0, 115.0, 215.0, 456.0, 1240.0, 3374.0, 12545.0, 83906.0, 4020917.0, 57434.0, 9517.0, 2671.0, 921.0, 400.0, 174.0, 111.0, 52.0, 37.0, 16.0, 11.0, 13.0, 4.0, 11.0, 8.0, 9.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7890625, -4.5545654296875, -4.320068359375, -4.0855712890625, -3.85107421875, -3.6165771484375, -3.382080078125, -3.1475830078125, -2.9130859375, -2.6785888671875, -2.444091796875, -2.2095947265625, -1.97509765625, -1.7406005859375, -1.506103515625, -1.2716064453125, -1.037109375, -0.8026123046875, -0.568115234375, -0.3336181640625, -0.09912109375, 0.1353759765625, 0.369873046875, 0.6043701171875, 0.8388671875, 1.0733642578125, 1.307861328125, 1.5423583984375, 1.77685546875, 2.0113525390625, 2.245849609375, 2.4803466796875, 2.71484375, 2.9493408203125, 3.183837890625, 3.4183349609375, 3.65283203125, 3.8873291015625, 4.121826171875, 4.3563232421875, 4.5908203125, 4.8253173828125, 5.059814453125, 5.2943115234375, 5.52880859375, 5.7633056640625, 5.997802734375, 6.2322998046875, 6.466796875, 6.7012939453125, 6.935791015625, 7.1702880859375, 7.40478515625, 7.6392822265625, 7.873779296875, 8.1082763671875, 8.3427734375, 8.5772705078125, 8.811767578125, 9.0462646484375, 9.28076171875, 9.5152587890625, 9.749755859375, 9.9842529296875, 10.21875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 9.0, 4.0, 7.0, 6.0, 14.0, 22.0, 27.0, 28.0, 33.0, 34.0, 42.0, 30.0, 53.0, 64.0, 67.0, 63.0, 57.0, 56.0, 70.0, 68.0, 44.0, 49.0, 30.0, 23.0, 27.0, 12.0, 14.0, 8.0, 15.0, 6.0, 5.0, 9.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.232421875, -1.1948699951171875, -1.157318115234375, -1.1197662353515625, -1.08221435546875, -1.0446624755859375, -1.007110595703125, -0.9695587158203125, -0.9320068359375, -0.8944549560546875, -0.856903076171875, -0.8193511962890625, -0.78179931640625, -0.7442474365234375, -0.706695556640625, -0.6691436767578125, -0.631591796875, -0.5940399169921875, -0.556488037109375, -0.5189361572265625, -0.48138427734375, -0.4438323974609375, -0.406280517578125, -0.3687286376953125, -0.3311767578125, -0.2936248779296875, -0.256072998046875, -0.2185211181640625, -0.18096923828125, -0.1434173583984375, -0.105865478515625, -0.0683135986328125, -0.03076171875, 0.0067901611328125, 0.044342041015625, 0.0818939208984375, 0.11944580078125, 0.1569976806640625, 0.194549560546875, 0.2321014404296875, 0.2696533203125, 0.3072052001953125, 0.344757080078125, 0.3823089599609375, 0.41986083984375, 0.4574127197265625, 0.494964599609375, 0.5325164794921875, 0.570068359375, 0.6076202392578125, 0.645172119140625, 0.6827239990234375, 0.72027587890625, 0.7578277587890625, 0.795379638671875, 0.8329315185546875, 0.8704833984375, 0.9080352783203125, 0.945587158203125, 0.9831390380859375, 1.02069091796875, 1.0582427978515625, 1.095794677734375, 1.1333465576171875, 1.1708984375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 4.0, 7.0, 12.0, 12.0, 9.0, 22.0, 28.0, 43.0, 79.0, 86.0, 137.0, 161.0, 247.0, 338.0, 491.0, 755.0, 1128.0, 1815.0, 2987.0, 5204.0, 10131.0, 22216.0, 60485.0, 347261.0, 3538200.0, 131734.0, 37091.0, 15237.0, 7407.0, 4170.0, 2332.0, 1440.0, 941.0, 623.0, 432.0, 293.0, 205.0, 144.0, 100.0, 80.0, 48.0, 53.0, 20.0, 20.0, 21.0, 15.0, 4.0, 7.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.53125, -2.4503173828125, -2.369384765625, -2.2884521484375, -2.20751953125, -2.1265869140625, -2.045654296875, -1.9647216796875, -1.8837890625, -1.8028564453125, -1.721923828125, -1.6409912109375, -1.56005859375, -1.4791259765625, -1.398193359375, -1.3172607421875, -1.236328125, -1.1553955078125, -1.074462890625, -0.9935302734375, -0.91259765625, -0.8316650390625, -0.750732421875, -0.6697998046875, -0.5888671875, -0.5079345703125, -0.427001953125, -0.3460693359375, -0.26513671875, -0.1842041015625, -0.103271484375, -0.0223388671875, 0.05859375, 0.1395263671875, 0.220458984375, 0.3013916015625, 0.38232421875, 0.4632568359375, 0.544189453125, 0.6251220703125, 0.7060546875, 0.7869873046875, 0.867919921875, 0.9488525390625, 1.02978515625, 1.1107177734375, 1.191650390625, 1.2725830078125, 1.353515625, 1.4344482421875, 1.515380859375, 1.5963134765625, 1.67724609375, 1.7581787109375, 1.839111328125, 1.9200439453125, 2.0009765625, 2.0819091796875, 2.162841796875, 2.2437744140625, 2.32470703125, 2.4056396484375, 2.486572265625, 2.5675048828125, 2.6484375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 6.0, 5.0, 11.0, 11.0, 19.0, 18.0, 32.0, 62.0, 106.0, 384.0, 2897.0, 272.0, 109.0, 41.0, 28.0, 23.0, 13.0, 20.0, 3.0, 6.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.80859375, -2.72698974609375, -2.6453857421875, -2.56378173828125, -2.482177734375, -2.40057373046875, -2.3189697265625, -2.23736572265625, -2.15576171875, -2.07415771484375, -1.9925537109375, -1.91094970703125, -1.829345703125, -1.74774169921875, -1.6661376953125, -1.58453369140625, -1.5029296875, -1.42132568359375, -1.3397216796875, -1.25811767578125, -1.176513671875, -1.09490966796875, -1.0133056640625, -0.93170166015625, -0.85009765625, -0.76849365234375, -0.6868896484375, -0.60528564453125, -0.523681640625, -0.44207763671875, -0.3604736328125, -0.27886962890625, -0.197265625, -0.11566162109375, -0.0340576171875, 0.04754638671875, 0.129150390625, 0.21075439453125, 0.2923583984375, 0.37396240234375, 0.45556640625, 0.53717041015625, 0.6187744140625, 0.70037841796875, 0.781982421875, 0.86358642578125, 0.9451904296875, 1.02679443359375, 1.1083984375, 1.19000244140625, 1.2716064453125, 1.35321044921875, 1.434814453125, 1.51641845703125, 1.5980224609375, 1.67962646484375, 1.76123046875, 1.84283447265625, 1.9244384765625, 2.00604248046875, 2.087646484375, 2.16925048828125, 2.2508544921875, 2.33245849609375, 2.4140625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 5.0, 26.0, 55.0, 115.0, 245.0, 276.0, 156.0, 81.0, 24.0, 12.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.386353492736816, -11.836167335510254, -11.285981178283691, -10.735794067382812, -10.18560791015625, -9.635421752929688, -9.085235595703125, -8.535049438476562, -7.984862804412842, -7.434676647186279, -6.884490013122559, -6.334303855895996, -5.784117698669434, -5.233931064605713, -4.68374490737915, -4.13355827331543, -3.583372116088867, -3.0331857204437256, -2.482999324798584, -1.9328131675720215, -1.3826267719268799, -0.8324403762817383, -0.2822542190551758, 0.2679321765899658, 0.8181185722351074, 1.368304967880249, 1.918491244316101, 2.468677520751953, 3.0188639163970947, 3.5690503120422363, 4.119236469268799, 4.6694231033325195, 5.219610214233398, 5.769796371459961, 6.319983005523682, 6.870169162750244, 7.420355796813965, 7.970541954040527, 8.52072811126709, 9.070914268493652, 9.621101379394531, 10.171287536621094, 10.721473693847656, 11.271659851074219, 11.821846961975098, 12.37203311920166, 12.922219276428223, 13.472405433654785, 14.022591590881348, 14.57277774810791, 15.122963905334473, 15.673151016235352, 16.223337173461914, 16.773523330688477, 17.32370948791504, 17.8738956451416, 18.424081802368164, 18.974267959594727, 19.52445411682129, 20.07464027404785, 20.624826431274414, 21.17501449584961, 21.725200653076172, 22.275386810302734, 22.825572967529297]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 5.0, 11.0, 7.0, 19.0, 23.0, 14.0, 18.0, 21.0, 40.0, 41.0, 33.0, 54.0, 54.0, 50.0, 51.0, 60.0, 58.0, 47.0, 49.0, 44.0, 50.0, 39.0, 45.0, 34.0, 26.0, 21.0, 20.0, 18.0, 12.0, 9.0, 8.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.717714309692383, -4.512407302856445, -4.307100772857666, -4.1017937660217285, -3.89648699760437, -3.6911802291870117, -3.4858734607696533, -3.280566692352295, -3.0752596855163574, -2.869952917098999, -2.6646461486816406, -2.459339141845703, -2.2540323734283447, -2.0487256050109863, -1.843418836593628, -1.63811194896698, -1.4328052997589111, -1.2274985313415527, -1.0221916437149048, -0.8168848752975464, -0.6115780472755432, -0.40627121925354004, -0.20096445083618164, 0.004342436790466309, 0.2096492052078247, 0.4149560332298279, 0.620262861251831, 0.8255696296691895, 1.0308763980865479, 1.2361832857131958, 1.4414900541305542, 1.6467969417572021, 1.8521037101745605, 2.057410478591919, 2.2627172470092773, 2.468024253845215, 2.6733310222625732, 2.8786377906799316, 3.08394455909729, 3.2892513275146484, 3.494558334350586, 3.6998651027679443, 3.9051718711853027, 4.11047887802124, 4.3157854080200195, 4.521092414855957, 4.7263994216918945, 4.931705951690674, 5.137012481689453, 5.342319488525391, 5.54762601852417, 5.752933025360107, 5.958239555358887, 6.163546562194824, 6.368853569030762, 6.574160099029541, 6.7794671058654785, 6.984774112701416, 7.190080642700195, 7.395387649536133, 7.600694179534912, 7.80600118637085, 8.011307716369629, 8.216614723205566, 8.421921730041504]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 7.0, 1.0, 6.0, 7.0, 15.0, 8.0, 19.0, 30.0, 75.0, 150.0, 290.0, 731.0, 2206.0, 8465.0, 46912.0, 409523.0, 507597.0, 58387.0, 10117.0, 2520.0, 829.0, 333.0, 139.0, 81.0, 40.0, 24.0, 19.0, 11.0, 6.0, 3.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.07421875, -4.9053955078125, -4.736572265625, -4.5677490234375, -4.39892578125, -4.2301025390625, -4.061279296875, -3.8924560546875, -3.7236328125, -3.5548095703125, -3.385986328125, -3.2171630859375, -3.04833984375, -2.8795166015625, -2.710693359375, -2.5418701171875, -2.373046875, -2.2042236328125, -2.035400390625, -1.8665771484375, -1.69775390625, -1.5289306640625, -1.360107421875, -1.1912841796875, -1.0224609375, -0.8536376953125, -0.684814453125, -0.5159912109375, -0.34716796875, -0.1783447265625, -0.009521484375, 0.1593017578125, 0.328125, 0.4969482421875, 0.665771484375, 0.8345947265625, 1.00341796875, 1.1722412109375, 1.341064453125, 1.5098876953125, 1.6787109375, 1.8475341796875, 2.016357421875, 2.1851806640625, 2.35400390625, 2.5228271484375, 2.691650390625, 2.8604736328125, 3.029296875, 3.1981201171875, 3.366943359375, 3.5357666015625, 3.70458984375, 3.8734130859375, 4.042236328125, 4.2110595703125, 4.3798828125, 4.5487060546875, 4.717529296875, 4.8863525390625, 5.05517578125, 5.2239990234375, 5.392822265625, 5.5616455078125, 5.73046875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 11.0, 11.0, 22.0, 16.0, 23.0, 21.0, 35.0, 34.0, 47.0, 36.0, 57.0, 54.0, 56.0, 49.0, 77.0, 72.0, 59.0, 60.0, 46.0, 45.0, 45.0, 25.0, 25.0, 14.0, 18.0, 12.0, 11.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2978515625, -1.257110595703125, -1.21636962890625, -1.175628662109375, -1.1348876953125, -1.094146728515625, -1.05340576171875, -1.012664794921875, -0.971923828125, -0.931182861328125, -0.89044189453125, -0.849700927734375, -0.8089599609375, -0.768218994140625, -0.72747802734375, -0.686737060546875, -0.64599609375, -0.605255126953125, -0.56451416015625, -0.523773193359375, -0.4830322265625, -0.442291259765625, -0.40155029296875, -0.360809326171875, -0.320068359375, -0.279327392578125, -0.23858642578125, -0.197845458984375, -0.1571044921875, -0.116363525390625, -0.07562255859375, -0.034881591796875, 0.005859375, 0.046600341796875, 0.08734130859375, 0.128082275390625, 0.1688232421875, 0.209564208984375, 0.25030517578125, 0.291046142578125, 0.331787109375, 0.372528076171875, 0.41326904296875, 0.454010009765625, 0.4947509765625, 0.535491943359375, 0.57623291015625, 0.616973876953125, 0.65771484375, 0.698455810546875, 0.73919677734375, 0.779937744140625, 0.8206787109375, 0.861419677734375, 0.90216064453125, 0.942901611328125, 0.983642578125, 1.024383544921875, 1.06512451171875, 1.105865478515625, 1.1466064453125, 1.187347412109375, 1.22808837890625, 1.268829345703125, 1.3095703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 0.0, 6.0, 0.0, 9.0, 6.0, 14.0, 21.0, 42.0, 47.0, 97.0, 165.0, 338.0, 764.0, 1891.0, 5228.0, 17196.0, 78343.0, 558887.0, 320674.0, 46779.0, 11682.0, 3682.0, 1483.0, 581.0, 292.0, 152.0, 66.0, 40.0, 24.0, 23.0, 8.0, 11.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.837890625, -3.713470458984375, -3.58905029296875, -3.464630126953125, -3.3402099609375, -3.215789794921875, -3.09136962890625, -2.966949462890625, -2.842529296875, -2.718109130859375, -2.59368896484375, -2.469268798828125, -2.3448486328125, -2.220428466796875, -2.09600830078125, -1.971588134765625, -1.84716796875, -1.722747802734375, -1.59832763671875, -1.473907470703125, -1.3494873046875, -1.225067138671875, -1.10064697265625, -0.976226806640625, -0.851806640625, -0.727386474609375, -0.60296630859375, -0.478546142578125, -0.3541259765625, -0.229705810546875, -0.10528564453125, 0.019134521484375, 0.1435546875, 0.267974853515625, 0.39239501953125, 0.516815185546875, 0.6412353515625, 0.765655517578125, 0.89007568359375, 1.014495849609375, 1.138916015625, 1.263336181640625, 1.38775634765625, 1.512176513671875, 1.6365966796875, 1.761016845703125, 1.88543701171875, 2.009857177734375, 2.13427734375, 2.258697509765625, 2.38311767578125, 2.507537841796875, 2.6319580078125, 2.756378173828125, 2.88079833984375, 3.005218505859375, 3.129638671875, 3.254058837890625, 3.37847900390625, 3.502899169921875, 3.6273193359375, 3.751739501953125, 3.87615966796875, 4.000579833984375, 4.125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 9.0, 15.0, 11.0, 11.0, 22.0, 24.0, 24.0, 25.0, 37.0, 42.0, 48.0, 52.0, 64.0, 63.0, 64.0, 65.0, 65.0, 46.0, 36.0, 48.0, 50.0, 30.0, 35.0, 21.0, 21.0, 20.0, 11.0, 8.0, 10.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.50390625, -5.33001708984375, -5.1561279296875, -4.98223876953125, -4.808349609375, -4.63446044921875, -4.4605712890625, -4.28668212890625, -4.11279296875, -3.93890380859375, -3.7650146484375, -3.59112548828125, -3.417236328125, -3.24334716796875, -3.0694580078125, -2.89556884765625, -2.7216796875, -2.54779052734375, -2.3739013671875, -2.20001220703125, -2.026123046875, -1.85223388671875, -1.6783447265625, -1.50445556640625, -1.33056640625, -1.15667724609375, -0.9827880859375, -0.80889892578125, -0.635009765625, -0.46112060546875, -0.2872314453125, -0.11334228515625, 0.060546875, 0.23443603515625, 0.4083251953125, 0.58221435546875, 0.756103515625, 0.92999267578125, 1.1038818359375, 1.27777099609375, 1.45166015625, 1.62554931640625, 1.7994384765625, 1.97332763671875, 2.147216796875, 2.32110595703125, 2.4949951171875, 2.66888427734375, 2.8427734375, 3.01666259765625, 3.1905517578125, 3.36444091796875, 3.538330078125, 3.71221923828125, 3.8861083984375, 4.05999755859375, 4.23388671875, 4.40777587890625, 4.5816650390625, 4.75555419921875, 4.929443359375, 5.10333251953125, 5.2772216796875, 5.45111083984375, 5.625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 3.0, 6.0, 4.0, 4.0, 10.0, 15.0, 13.0, 6.0, 14.0, 31.0, 43.0, 52.0, 91.0, 154.0, 261.0, 488.0, 935.0, 1858.0, 4370.0, 12140.0, 46420.0, 295500.0, 561734.0, 92905.0, 19697.0, 6499.0, 2604.0, 1225.0, 616.0, 328.0, 188.0, 111.0, 59.0, 48.0, 37.0, 27.0, 19.0, 11.0, 7.0, 7.0, 4.0, 2.0, 2.0, 5.0, 7.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.7724609375, -1.72064208984375, -1.6688232421875, -1.61700439453125, -1.565185546875, -1.51336669921875, -1.4615478515625, -1.40972900390625, -1.35791015625, -1.30609130859375, -1.2542724609375, -1.20245361328125, -1.150634765625, -1.09881591796875, -1.0469970703125, -0.99517822265625, -0.943359375, -0.89154052734375, -0.8397216796875, -0.78790283203125, -0.736083984375, -0.68426513671875, -0.6324462890625, -0.58062744140625, -0.52880859375, -0.47698974609375, -0.4251708984375, -0.37335205078125, -0.321533203125, -0.26971435546875, -0.2178955078125, -0.16607666015625, -0.1142578125, -0.06243896484375, -0.0106201171875, 0.04119873046875, 0.093017578125, 0.14483642578125, 0.1966552734375, 0.24847412109375, 0.30029296875, 0.35211181640625, 0.4039306640625, 0.45574951171875, 0.507568359375, 0.55938720703125, 0.6112060546875, 0.66302490234375, 0.71484375, 0.76666259765625, 0.8184814453125, 0.87030029296875, 0.922119140625, 0.97393798828125, 1.0257568359375, 1.07757568359375, 1.12939453125, 1.18121337890625, 1.2330322265625, 1.28485107421875, 1.336669921875, 1.38848876953125, 1.4403076171875, 1.49212646484375, 1.5439453125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 3.0, 5.0, 9.0, 7.0, 13.0, 24.0, 43.0, 58.0, 110.0, 169.0, 191.0, 147.0, 86.0, 48.0, 31.0, 23.0, 13.0, 6.0, 2.0, 4.0, 4.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004870891571044922, -0.00047152116894721985, -0.0004559531807899475, -0.00044038519263267517, -0.00042481720447540283, -0.0004092492163181305, -0.00039368122816085815, -0.0003781132400035858, -0.0003625452518463135, -0.00034697726368904114, -0.0003314092755317688, -0.00031584128737449646, -0.0003002732992172241, -0.0002847053110599518, -0.00026913732290267944, -0.0002535693347454071, -0.00023800134658813477, -0.00022243335843086243, -0.0002068653702735901, -0.00019129738211631775, -0.0001757293939590454, -0.00016016140580177307, -0.00014459341764450073, -0.0001290254294872284, -0.00011345744132995605, -9.788945317268372e-05, -8.232146501541138e-05, -6.675347685813904e-05, -5.11854887008667e-05, -3.561750054359436e-05, -2.004951238632202e-05, -4.481524229049683e-06, 1.1086463928222656e-05, 2.6654452085494995e-05, 4.2222440242767334e-05, 5.779042840003967e-05, 7.335841655731201e-05, 8.892640471458435e-05, 0.00010449439287185669, 0.00012006238102912903, 0.00013563036918640137, 0.0001511983573436737, 0.00016676634550094604, 0.00018233433365821838, 0.00019790232181549072, 0.00021347030997276306, 0.0002290382981300354, 0.00024460628628730774, 0.0002601742744445801, 0.0002757422626018524, 0.00029131025075912476, 0.0003068782389163971, 0.00032244622707366943, 0.00033801421523094177, 0.0003535822033882141, 0.00036915019154548645, 0.0003847181797027588, 0.00040028616786003113, 0.00041585415601730347, 0.0004314221441745758, 0.00044699013233184814, 0.0004625581204891205, 0.0004781261086463928, 0.0004936940968036652, 0.0005092620849609375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 9.0, 13.0, 26.0, 21.0, 31.0, 45.0, 72.0, 121.0, 186.0, 298.0, 516.0, 980.0, 1824.0, 3861.0, 8919.0, 26092.0, 102347.0, 450165.0, 345111.0, 73451.0, 20173.0, 7303.0, 3272.0, 1615.0, 809.0, 486.0, 299.0, 160.0, 117.0, 74.0, 40.0, 27.0, 24.0, 17.0, 13.0, 16.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1279296875, -1.0859832763671875, -1.044036865234375, -1.0020904541015625, -0.96014404296875, -0.9181976318359375, -0.876251220703125, -0.8343048095703125, -0.7923583984375, -0.7504119873046875, -0.708465576171875, -0.6665191650390625, -0.62457275390625, -0.5826263427734375, -0.540679931640625, -0.4987335205078125, -0.456787109375, -0.4148406982421875, -0.372894287109375, -0.3309478759765625, -0.28900146484375, -0.2470550537109375, -0.205108642578125, -0.1631622314453125, -0.1212158203125, -0.0792694091796875, -0.037322998046875, 0.0046234130859375, 0.04656982421875, 0.0885162353515625, 0.130462646484375, 0.1724090576171875, 0.21435546875, 0.2563018798828125, 0.298248291015625, 0.3401947021484375, 0.38214111328125, 0.4240875244140625, 0.466033935546875, 0.5079803466796875, 0.5499267578125, 0.5918731689453125, 0.633819580078125, 0.6757659912109375, 0.71771240234375, 0.7596588134765625, 0.801605224609375, 0.8435516357421875, 0.885498046875, 0.9274444580078125, 0.969390869140625, 1.0113372802734375, 1.05328369140625, 1.0952301025390625, 1.137176513671875, 1.1791229248046875, 1.2210693359375, 1.2630157470703125, 1.304962158203125, 1.3469085693359375, 1.38885498046875, 1.4308013916015625, 1.472747802734375, 1.5146942138671875, 1.556640625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 0.0, 7.0, 5.0, 8.0, 13.0, 9.0, 21.0, 17.0, 25.0, 39.0, 49.0, 67.0, 60.0, 91.0, 101.0, 94.0, 87.0, 76.0, 60.0, 40.0, 30.0, 20.0, 15.0, 16.0, 10.0, 9.0, 5.0, 3.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2841796875, -1.236236572265625, -1.18829345703125, -1.140350341796875, -1.0924072265625, -1.044464111328125, -0.99652099609375, -0.948577880859375, -0.900634765625, -0.852691650390625, -0.80474853515625, -0.756805419921875, -0.7088623046875, -0.660919189453125, -0.61297607421875, -0.565032958984375, -0.51708984375, -0.469146728515625, -0.42120361328125, -0.373260498046875, -0.3253173828125, -0.277374267578125, -0.22943115234375, -0.181488037109375, -0.133544921875, -0.085601806640625, -0.03765869140625, 0.010284423828125, 0.0582275390625, 0.106170654296875, 0.15411376953125, 0.202056884765625, 0.25, 0.297943115234375, 0.34588623046875, 0.393829345703125, 0.4417724609375, 0.489715576171875, 0.53765869140625, 0.585601806640625, 0.633544921875, 0.681488037109375, 0.72943115234375, 0.777374267578125, 0.8253173828125, 0.873260498046875, 0.92120361328125, 0.969146728515625, 1.01708984375, 1.065032958984375, 1.11297607421875, 1.160919189453125, 1.2088623046875, 1.256805419921875, 1.30474853515625, 1.352691650390625, 1.400634765625, 1.448577880859375, 1.49652099609375, 1.544464111328125, 1.5924072265625, 1.640350341796875, 1.68829345703125, 1.736236572265625, 1.7841796875]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 9.0, 28.0, 96.0, 270.0, 354.0, 164.0, 67.0, 15.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.778488159179688, -24.61853790283203, -22.458589553833008, -20.29863929748535, -18.138690948486328, -15.978740692138672, -13.818790435791016, -11.658841133117676, -9.498891830444336, -7.338942527770996, -5.178992748260498, -3.01904296875, -0.8590936660766602, 1.3008556365966797, 3.460805892944336, 5.620755195617676, 7.780704498291016, 9.940653800964355, 12.100603103637695, 14.260553359985352, 16.420501708984375, 18.58045196533203, 20.740402221679688, 22.900352478027344, 25.060300827026367, 27.220251083374023, 29.380199432373047, 31.540149688720703, 33.70009994506836, 35.86004638671875, 38.019996643066406, 40.17994689941406, 42.33989715576172, 44.499847412109375, 46.65979766845703, 48.81974792480469, 50.97969436645508, 53.139644622802734, 55.29959487915039, 57.45954513549805, 59.61949157714844, 61.779441833496094, 63.93939208984375, 66.0993423461914, 68.25929260253906, 70.41923522949219, 72.57919311523438, 74.7391357421875, 76.89909362792969, 79.05904388427734, 81.218994140625, 83.37894439697266, 85.53889465332031, 87.69883728027344, 89.85879516601562, 92.01873779296875, 94.1786880493164, 96.33863830566406, 98.49858856201172, 100.65853881835938, 102.81848907470703, 104.97843933105469, 107.13838195800781, 109.29833221435547, 111.45828247070312]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 3.0, 1.0, 2.0, 6.0, 5.0, 10.0, 9.0, 8.0, 11.0, 20.0, 14.0, 22.0, 26.0, 24.0, 33.0, 26.0, 33.0, 27.0, 34.0, 45.0, 42.0, 51.0, 49.0, 40.0, 38.0, 51.0, 54.0, 43.0, 23.0, 33.0, 28.0, 29.0, 25.0, 18.0, 26.0, 19.0, 16.0, 8.0, 8.0, 5.0, 13.0, 7.0, 11.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.867122650146484, -23.07390594482422, -22.280691146850586, -21.48747444152832, -20.694259643554688, -19.901042938232422, -19.10782814025879, -18.314611434936523, -17.52139663696289, -16.728179931640625, -15.934965133666992, -15.141749382019043, -14.348533630371094, -13.555317878723145, -12.762102127075195, -11.96888542175293, -11.17566967010498, -10.382453918457031, -9.589238166809082, -8.796022415161133, -8.002806663513184, -7.209590911865234, -6.416374683380127, -5.623158931732178, -4.8299431800842285, -4.036727428436279, -3.24351167678833, -2.4502956867218018, -1.6570799350738525, -0.8638641834259033, -0.070648193359375, 0.7225675582885742, 1.5157833099365234, 2.3089990615844727, 3.102214813232422, 3.89543080329895, 4.68864631652832, 5.4818620681762695, 6.275078296661377, 7.068294048309326, 7.861509799957275, 8.654726028442383, 9.447941780090332, 10.241157531738281, 11.03437328338623, 11.82758903503418, 12.620804786682129, 13.414020538330078, 14.207236289978027, 15.000452041625977, 15.793667793273926, 16.586883544921875, 17.38010025024414, 18.173315048217773, 18.96653175354004, 19.759746551513672, 20.552963256835938, 21.346179962158203, 22.139394760131836, 22.9326114654541, 23.725826263427734, 24.51904296875, 25.312257766723633, 26.1054744720459, 26.89868927001953]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 7.0, 21.0, 23.0, 31.0, 72.0, 107.0, 204.0, 372.0, 914.0, 4305.0, 4170975.0, 14583.0, 1601.0, 476.0, 253.0, 139.0, 64.0, 46.0, 30.0, 19.0, 21.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0234375, -8.5413818359375, -8.059326171875, -7.5772705078125, -7.09521484375, -6.6131591796875, -6.131103515625, -5.6490478515625, -5.1669921875, -4.6849365234375, -4.202880859375, -3.7208251953125, -3.23876953125, -2.7567138671875, -2.274658203125, -1.7926025390625, -1.310546875, -0.8284912109375, -0.346435546875, 0.1356201171875, 0.61767578125, 1.0997314453125, 1.581787109375, 2.0638427734375, 2.5458984375, 3.0279541015625, 3.510009765625, 3.9920654296875, 4.47412109375, 4.9561767578125, 5.438232421875, 5.9202880859375, 6.40234375, 6.8843994140625, 7.366455078125, 7.8485107421875, 8.33056640625, 8.8126220703125, 9.294677734375, 9.7767333984375, 10.2587890625, 10.7408447265625, 11.222900390625, 11.7049560546875, 12.18701171875, 12.6690673828125, 13.151123046875, 13.6331787109375, 14.115234375, 14.5972900390625, 15.079345703125, 15.5614013671875, 16.04345703125, 16.5255126953125, 17.007568359375, 17.4896240234375, 17.9716796875, 18.4537353515625, 18.935791015625, 19.4178466796875, 19.89990234375, 20.3819580078125, 20.864013671875, 21.3460693359375, 21.828125]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 9.0, 6.0, 5.0, 18.0, 19.0, 18.0, 22.0, 20.0, 25.0, 34.0, 34.0, 26.0, 48.0, 47.0, 43.0, 38.0, 52.0, 61.0, 58.0, 43.0, 63.0, 41.0, 39.0, 42.0, 35.0, 35.0, 22.0, 23.0, 18.0, 12.0, 5.0, 11.0, 3.0, 8.0, 2.0, 3.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.4853515625, -1.4428558349609375, -1.400360107421875, -1.3578643798828125, -1.31536865234375, -1.2728729248046875, -1.230377197265625, -1.1878814697265625, -1.1453857421875, -1.1028900146484375, -1.060394287109375, -1.0178985595703125, -0.97540283203125, -0.9329071044921875, -0.890411376953125, -0.8479156494140625, -0.805419921875, -0.7629241943359375, -0.720428466796875, -0.6779327392578125, -0.63543701171875, -0.5929412841796875, -0.550445556640625, -0.5079498291015625, -0.4654541015625, -0.4229583740234375, -0.380462646484375, -0.3379669189453125, -0.29547119140625, -0.2529754638671875, -0.210479736328125, -0.1679840087890625, -0.12548828125, -0.0829925537109375, -0.040496826171875, 0.0019989013671875, 0.04449462890625, 0.0869903564453125, 0.129486083984375, 0.1719818115234375, 0.2144775390625, 0.2569732666015625, 0.299468994140625, 0.3419647216796875, 0.38446044921875, 0.4269561767578125, 0.469451904296875, 0.5119476318359375, 0.554443359375, 0.5969390869140625, 0.639434814453125, 0.6819305419921875, 0.72442626953125, 0.7669219970703125, 0.809417724609375, 0.8519134521484375, 0.8944091796875, 0.9369049072265625, 0.979400634765625, 1.0218963623046875, 1.06439208984375, 1.1068878173828125, 1.149383544921875, 1.1918792724609375, 1.234375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 7.0, 11.0, 15.0, 19.0, 30.0, 38.0, 48.0, 58.0, 74.0, 88.0, 142.0, 188.0, 282.0, 525.0, 1190.0, 3620.0, 17629.0, 4126952.0, 34619.0, 5373.0, 1759.0, 579.0, 331.0, 178.0, 128.0, 93.0, 87.0, 73.0, 32.0, 18.0, 26.0, 23.0, 20.0, 13.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.06640625, -5.88604736328125, -5.7056884765625, -5.52532958984375, -5.344970703125, -5.16461181640625, -4.9842529296875, -4.80389404296875, -4.62353515625, -4.44317626953125, -4.2628173828125, -4.08245849609375, -3.902099609375, -3.72174072265625, -3.5413818359375, -3.36102294921875, -3.1806640625, -3.00030517578125, -2.8199462890625, -2.63958740234375, -2.459228515625, -2.27886962890625, -2.0985107421875, -1.91815185546875, -1.73779296875, -1.55743408203125, -1.3770751953125, -1.19671630859375, -1.016357421875, -0.83599853515625, -0.6556396484375, -0.47528076171875, -0.294921875, -0.11456298828125, 0.0657958984375, 0.24615478515625, 0.426513671875, 0.60687255859375, 0.7872314453125, 0.96759033203125, 1.14794921875, 1.32830810546875, 1.5086669921875, 1.68902587890625, 1.869384765625, 2.04974365234375, 2.2301025390625, 2.41046142578125, 2.5908203125, 2.77117919921875, 2.9515380859375, 3.13189697265625, 3.312255859375, 3.49261474609375, 3.6729736328125, 3.85333251953125, 4.03369140625, 4.21405029296875, 4.3944091796875, 4.57476806640625, 4.755126953125, 4.93548583984375, 5.1158447265625, 5.29620361328125, 5.4765625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 13.0, 24.0, 148.0, 3751.0, 70.0, 23.0, 12.0, 4.0, 13.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6474609375, -1.6140480041503906, -1.5806350708007812, -1.5472221374511719, -1.5138092041015625, -1.4803962707519531, -1.4469833374023438, -1.4135704040527344, -1.380157470703125, -1.3467445373535156, -1.3133316040039062, -1.2799186706542969, -1.2465057373046875, -1.2130928039550781, -1.1796798706054688, -1.1462669372558594, -1.11285400390625, -1.0794410705566406, -1.0460281372070312, -1.0126152038574219, -0.9792022705078125, -0.9457893371582031, -0.9123764038085938, -0.8789634704589844, -0.845550537109375, -0.8121376037597656, -0.7787246704101562, -0.7453117370605469, -0.7118988037109375, -0.6784858703613281, -0.6450729370117188, -0.6116600036621094, -0.5782470703125, -0.5448341369628906, -0.5114212036132812, -0.4780082702636719, -0.4445953369140625, -0.4111824035644531, -0.37776947021484375, -0.3443565368652344, -0.310943603515625, -0.2775306701660156, -0.24411773681640625, -0.21070480346679688, -0.1772918701171875, -0.14387893676757812, -0.11046600341796875, -0.07705307006835938, -0.04364013671875, -0.010227203369140625, 0.02318572998046875, 0.056598663330078125, 0.0900115966796875, 0.12342453002929688, 0.15683746337890625, 0.19025039672851562, 0.223663330078125, 0.2570762634277344, 0.29048919677734375, 0.3239021301269531, 0.3573150634765625, 0.3907279968261719, 0.42414093017578125, 0.4575538635253906, 0.490966796875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 11.0, 13.0, 24.0, 59.0, 89.0, 165.0, 247.0, 197.0, 117.0, 48.0, 20.0, 12.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.29643440246582, -8.130607604980469, -7.964781284332275, -7.798954486846924, -7.6331281661987305, -7.467301368713379, -7.3014750480651855, -7.135648250579834, -6.969821929931641, -6.803995132446289, -6.638168811798096, -6.472342014312744, -6.306515693664551, -6.140688896179199, -5.974862575531006, -5.809035778045654, -5.643208980560303, -5.477382183074951, -5.311555862426758, -5.145729064941406, -4.979902744293213, -4.814075946807861, -4.648249626159668, -4.482422828674316, -4.316596031188965, -4.150769233703613, -3.98494291305542, -3.8191163539886475, -3.653289794921875, -3.4874629974365234, -3.321636438369751, -3.1558098793029785, -2.989983081817627, -2.8241565227508545, -2.658329963684082, -2.4925034046173096, -2.326676845550537, -2.1608500480651855, -1.995023488998413, -1.8291969299316406, -1.6633703708648682, -1.4975438117980957, -1.3317172527313232, -1.1658905744552612, -1.0000640153884888, -0.8342374563217163, -0.6684108376502991, -0.5025842189788818, -0.3367576599121094, -0.17093107104301453, -0.005104482173919678, 0.16072210669517517, 0.32654869556427, 0.4923752546310425, 0.6582018733024597, 0.824028491973877, 0.9898550510406494, 1.1556816101074219, 1.3215081691741943, 1.4873348474502563, 1.6531614065170288, 1.8189879655838013, 1.9848146438598633, 2.1506412029266357, 2.316467761993408]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 6.0, 3.0, 13.0, 9.0, 8.0, 15.0, 24.0, 14.0, 19.0, 32.0, 29.0, 38.0, 37.0, 40.0, 42.0, 54.0, 38.0, 54.0, 42.0, 46.0, 46.0, 36.0, 46.0, 32.0, 35.0, 37.0, 26.0, 24.0, 22.0, 31.0, 20.0, 17.0, 13.0, 11.0, 9.0, 5.0, 6.0, 7.0, 6.0, 6.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7801048755645752, -1.718544363975525, -1.6569838523864746, -1.5954232215881348, -1.5338627099990845, -1.4723021984100342, -1.4107415676116943, -1.349181056022644, -1.2876205444335938, -1.2260600328445435, -1.1644995212554932, -1.1029388904571533, -1.041378378868103, -0.9798178672790527, -0.9182572960853577, -0.8566967248916626, -0.7951362133026123, -0.733575701713562, -0.6720151305198669, -0.6104545593261719, -0.5488940477371216, -0.4873335063457489, -0.4257729649543762, -0.36421242356300354, -0.30265188217163086, -0.24109134078025818, -0.1795307993888855, -0.11797025799751282, -0.05640971660614014, 0.005150824785232544, 0.06671136617660522, 0.1282719075679779, 0.18983244895935059, 0.25139299035072327, 0.31295353174209595, 0.37451407313346863, 0.4360746145248413, 0.497635155916214, 0.5591956973075867, 0.6207562685012817, 0.682316780090332, 0.7438772916793823, 0.8054378628730774, 0.8669984340667725, 0.9285589456558228, 0.990119457244873, 1.051680088043213, 1.1132405996322632, 1.1748011112213135, 1.2363616228103638, 1.297922134399414, 1.359482765197754, 1.4210432767868042, 1.4826037883758545, 1.5441644191741943, 1.6057249307632446, 1.667285442352295, 1.7288459539413452, 1.7904064655303955, 1.8519670963287354, 1.9135276079177856, 1.975088119506836, 2.036648750305176, 2.0982091426849365, 2.1597697734832764]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 13.0, 18.0, 17.0, 25.0, 38.0, 54.0, 88.0, 101.0, 177.0, 369.0, 721.0, 1854.0, 5372.0, 18888.0, 78090.0, 399389.0, 428831.0, 85066.0, 20063.0, 5812.0, 1926.0, 751.0, 339.0, 196.0, 98.0, 70.0, 63.0, 33.0, 25.0, 15.0, 11.0, 12.0, 9.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-5.453125, -5.3017578125, -5.150390625, -4.9990234375, -4.84765625, -4.6962890625, -4.544921875, -4.3935546875, -4.2421875, -4.0908203125, -3.939453125, -3.7880859375, -3.63671875, -3.4853515625, -3.333984375, -3.1826171875, -3.03125, -2.8798828125, -2.728515625, -2.5771484375, -2.42578125, -2.2744140625, -2.123046875, -1.9716796875, -1.8203125, -1.6689453125, -1.517578125, -1.3662109375, -1.21484375, -1.0634765625, -0.912109375, -0.7607421875, -0.609375, -0.4580078125, -0.306640625, -0.1552734375, -0.00390625, 0.1474609375, 0.298828125, 0.4501953125, 0.6015625, 0.7529296875, 0.904296875, 1.0556640625, 1.20703125, 1.3583984375, 1.509765625, 1.6611328125, 1.8125, 1.9638671875, 2.115234375, 2.2666015625, 2.41796875, 2.5693359375, 2.720703125, 2.8720703125, 3.0234375, 3.1748046875, 3.326171875, 3.4775390625, 3.62890625, 3.7802734375, 3.931640625, 4.0830078125, 4.234375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 9.0, 4.0, 7.0, 6.0, 10.0, 18.0, 20.0, 30.0, 18.0, 22.0, 30.0, 33.0, 42.0, 40.0, 33.0, 40.0, 49.0, 60.0, 49.0, 59.0, 59.0, 52.0, 56.0, 41.0, 32.0, 41.0, 30.0, 28.0, 19.0, 23.0, 11.0, 8.0, 4.0, 5.0, 7.0, 5.0, 1.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.7529296875, -1.70465087890625, -1.6563720703125, -1.60809326171875, -1.559814453125, -1.51153564453125, -1.4632568359375, -1.41497802734375, -1.36669921875, -1.31842041015625, -1.2701416015625, -1.22186279296875, -1.173583984375, -1.12530517578125, -1.0770263671875, -1.02874755859375, -0.98046875, -0.93218994140625, -0.8839111328125, -0.83563232421875, -0.787353515625, -0.73907470703125, -0.6907958984375, -0.64251708984375, -0.59423828125, -0.54595947265625, -0.4976806640625, -0.44940185546875, -0.401123046875, -0.35284423828125, -0.3045654296875, -0.25628662109375, -0.2080078125, -0.15972900390625, -0.1114501953125, -0.06317138671875, -0.014892578125, 0.03338623046875, 0.0816650390625, 0.12994384765625, 0.17822265625, 0.22650146484375, 0.2747802734375, 0.32305908203125, 0.371337890625, 0.41961669921875, 0.4678955078125, 0.51617431640625, 0.564453125, 0.61273193359375, 0.6610107421875, 0.70928955078125, 0.757568359375, 0.80584716796875, 0.8541259765625, 0.90240478515625, 0.95068359375, 0.99896240234375, 1.0472412109375, 1.09552001953125, 1.143798828125, 1.19207763671875, 1.2403564453125, 1.28863525390625, 1.3369140625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 11.0, 9.0, 26.0, 49.0, 77.0, 219.0, 698.0, 3012.0, 29505.0, 804678.0, 198286.0, 9875.0, 1417.0, 408.0, 134.0, 72.0, 31.0, 24.0, 11.0, 10.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0234375, -10.7237548828125, -10.424072265625, -10.1243896484375, -9.82470703125, -9.5250244140625, -9.225341796875, -8.9256591796875, -8.6259765625, -8.3262939453125, -8.026611328125, -7.7269287109375, -7.42724609375, -7.1275634765625, -6.827880859375, -6.5281982421875, -6.228515625, -5.9288330078125, -5.629150390625, -5.3294677734375, -5.02978515625, -4.7301025390625, -4.430419921875, -4.1307373046875, -3.8310546875, -3.5313720703125, -3.231689453125, -2.9320068359375, -2.63232421875, -2.3326416015625, -2.032958984375, -1.7332763671875, -1.43359375, -1.1339111328125, -0.834228515625, -0.5345458984375, -0.23486328125, 0.0648193359375, 0.364501953125, 0.6641845703125, 0.9638671875, 1.2635498046875, 1.563232421875, 1.8629150390625, 2.16259765625, 2.4622802734375, 2.761962890625, 3.0616455078125, 3.361328125, 3.6610107421875, 3.960693359375, 4.2603759765625, 4.56005859375, 4.8597412109375, 5.159423828125, 5.4591064453125, 5.7587890625, 6.0584716796875, 6.358154296875, 6.6578369140625, 6.95751953125, 7.2572021484375, 7.556884765625, 7.8565673828125, 8.15625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 7.0, 14.0, 10.0, 24.0, 37.0, 31.0, 56.0, 83.0, 65.0, 94.0, 109.0, 83.0, 81.0, 65.0, 73.0, 53.0, 34.0, 25.0, 18.0, 19.0, 8.0, 8.0, 5.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.65625, -7.26708984375, -6.8779296875, -6.48876953125, -6.099609375, -5.71044921875, -5.3212890625, -4.93212890625, -4.54296875, -4.15380859375, -3.7646484375, -3.37548828125, -2.986328125, -2.59716796875, -2.2080078125, -1.81884765625, -1.4296875, -1.04052734375, -0.6513671875, -0.26220703125, 0.126953125, 0.51611328125, 0.9052734375, 1.29443359375, 1.68359375, 2.07275390625, 2.4619140625, 2.85107421875, 3.240234375, 3.62939453125, 4.0185546875, 4.40771484375, 4.796875, 5.18603515625, 5.5751953125, 5.96435546875, 6.353515625, 6.74267578125, 7.1318359375, 7.52099609375, 7.91015625, 8.29931640625, 8.6884765625, 9.07763671875, 9.466796875, 9.85595703125, 10.2451171875, 10.63427734375, 11.0234375, 11.41259765625, 11.8017578125, 12.19091796875, 12.580078125, 12.96923828125, 13.3583984375, 13.74755859375, 14.13671875, 14.52587890625, 14.9150390625, 15.30419921875, 15.693359375, 16.08251953125, 16.4716796875, 16.86083984375, 17.25]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 25.0, 54.0, 112.0, 302.0, 1110.0, 14573.0, 1027159.0, 4200.0, 629.0, 232.0, 84.0, 25.0, 18.0, 11.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.9453125, -15.4014892578125, -14.857666015625, -14.3138427734375, -13.77001953125, -13.2261962890625, -12.682373046875, -12.1385498046875, -11.5947265625, -11.0509033203125, -10.507080078125, -9.9632568359375, -9.41943359375, -8.8756103515625, -8.331787109375, -7.7879638671875, -7.244140625, -6.7003173828125, -6.156494140625, -5.6126708984375, -5.06884765625, -4.5250244140625, -3.981201171875, -3.4373779296875, -2.8935546875, -2.3497314453125, -1.805908203125, -1.2620849609375, -0.71826171875, -0.1744384765625, 0.369384765625, 0.9132080078125, 1.45703125, 2.0008544921875, 2.544677734375, 3.0885009765625, 3.63232421875, 4.1761474609375, 4.719970703125, 5.2637939453125, 5.8076171875, 6.3514404296875, 6.895263671875, 7.4390869140625, 7.98291015625, 8.5267333984375, 9.070556640625, 9.6143798828125, 10.158203125, 10.7020263671875, 11.245849609375, 11.7896728515625, 12.33349609375, 12.8773193359375, 13.421142578125, 13.9649658203125, 14.5087890625, 15.0526123046875, 15.596435546875, 16.1402587890625, 16.68408203125, 17.2279052734375, 17.771728515625, 18.3155517578125, 18.859375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 12.0, 28.0, 88.0, 218.0, 331.0, 195.0, 64.0, 35.0, 15.0, 7.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0004241466522216797, -0.00039479508996009827, -0.00036544352769851685, -0.0003360919654369354, -0.000306740403175354, -0.0002773888409137726, -0.00024803727865219116, -0.00021868571639060974, -0.00018933415412902832, -0.0001599825918674469, -0.00013063102960586548, -0.00010127946734428406, -7.192790508270264e-05, -4.2576342821121216e-05, -1.3224780559539795e-05, 1.6126781702041626e-05, 4.547834396362305e-05, 7.482990622520447e-05, 0.00010418146848678589, 0.0001335330307483673, 0.00016288459300994873, 0.00019223615527153015, 0.00022158771753311157, 0.000250939279794693, 0.0002802908420562744, 0.00030964240431785583, 0.00033899396657943726, 0.0003683455288410187, 0.0003976970911026001, 0.0004270486533641815, 0.00045640021562576294, 0.00048575177788734436, 0.0005151033401489258, 0.0005444549024105072, 0.0005738064646720886, 0.00060315802693367, 0.0006325095891952515, 0.0006618611514568329, 0.0006912127137184143, 0.0007205642759799957, 0.0007499158382415771, 0.0007792674005031586, 0.00080861896276474, 0.0008379705250263214, 0.0008673220872879028, 0.0008966736495494843, 0.0009260252118110657, 0.0009553767740726471, 0.0009847283363342285, 0.00101407989859581, 0.0010434314608573914, 0.0010727830231189728, 0.0011021345853805542, 0.0011314861476421356, 0.001160837709903717, 0.0011901892721652985, 0.0012195408344268799, 0.0012488923966884613, 0.0012782439589500427, 0.0013075955212116241, 0.0013369470834732056, 0.001366298645734787, 0.0013956502079963684, 0.0014250017702579498, 0.0014543533325195312]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 10.0, 10.0, 12.0, 15.0, 23.0, 22.0, 34.0, 60.0, 71.0, 86.0, 121.0, 179.0, 276.0, 388.0, 635.0, 1082.0, 1780.0, 3652.0, 9505.0, 44639.0, 685402.0, 264363.0, 22988.0, 6392.0, 2773.0, 1451.0, 876.0, 563.0, 329.0, 231.0, 153.0, 125.0, 76.0, 76.0, 41.0, 29.0, 26.0, 17.0, 12.0, 6.0, 12.0, 7.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.79296875, -2.7052001953125, -2.617431640625, -2.5296630859375, -2.44189453125, -2.3541259765625, -2.266357421875, -2.1785888671875, -2.0908203125, -2.0030517578125, -1.915283203125, -1.8275146484375, -1.73974609375, -1.6519775390625, -1.564208984375, -1.4764404296875, -1.388671875, -1.3009033203125, -1.213134765625, -1.1253662109375, -1.03759765625, -0.9498291015625, -0.862060546875, -0.7742919921875, -0.6865234375, -0.5987548828125, -0.510986328125, -0.4232177734375, -0.33544921875, -0.2476806640625, -0.159912109375, -0.0721435546875, 0.015625, 0.1033935546875, 0.191162109375, 0.2789306640625, 0.36669921875, 0.4544677734375, 0.542236328125, 0.6300048828125, 0.7177734375, 0.8055419921875, 0.893310546875, 0.9810791015625, 1.06884765625, 1.1566162109375, 1.244384765625, 1.3321533203125, 1.419921875, 1.5076904296875, 1.595458984375, 1.6832275390625, 1.77099609375, 1.8587646484375, 1.946533203125, 2.0343017578125, 2.1220703125, 2.2098388671875, 2.297607421875, 2.3853759765625, 2.47314453125, 2.5609130859375, 2.648681640625, 2.7364501953125, 2.82421875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 4.0, 3.0, 9.0, 12.0, 28.0, 109.0, 375.0, 304.0, 92.0, 30.0, 12.0, 5.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.140625, -8.863037109375, -8.58544921875, -8.307861328125, -8.0302734375, -7.752685546875, -7.47509765625, -7.197509765625, -6.919921875, -6.642333984375, -6.36474609375, -6.087158203125, -5.8095703125, -5.531982421875, -5.25439453125, -4.976806640625, -4.69921875, -4.421630859375, -4.14404296875, -3.866455078125, -3.5888671875, -3.311279296875, -3.03369140625, -2.756103515625, -2.478515625, -2.200927734375, -1.92333984375, -1.645751953125, -1.3681640625, -1.090576171875, -0.81298828125, -0.535400390625, -0.2578125, 0.019775390625, 0.29736328125, 0.574951171875, 0.8525390625, 1.130126953125, 1.40771484375, 1.685302734375, 1.962890625, 2.240478515625, 2.51806640625, 2.795654296875, 3.0732421875, 3.350830078125, 3.62841796875, 3.906005859375, 4.18359375, 4.461181640625, 4.73876953125, 5.016357421875, 5.2939453125, 5.571533203125, 5.84912109375, 6.126708984375, 6.404296875, 6.681884765625, 6.95947265625, 7.237060546875, 7.5146484375, 7.792236328125, 8.06982421875, 8.347412109375, 8.625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 13.0, 25.0, 77.0, 173.0, 233.0, 222.0, 121.0, 64.0, 35.0, 19.0, 8.0, 3.0, 6.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.80406951904297, -26.681297302246094, -24.55852508544922, -22.435752868652344, -20.31298065185547, -18.190208435058594, -16.06743621826172, -13.944664001464844, -11.821891784667969, -9.699119567871094, -7.576347351074219, -5.453575134277344, -3.3308029174804688, -1.2080307006835938, 0.9147415161132812, 3.0375137329101562, 5.160285949707031, 7.283058166503906, 9.405830383300781, 11.528602600097656, 13.651374816894531, 15.774147033691406, 17.89691925048828, 20.019691467285156, 22.14246368408203, 24.265235900878906, 26.38800811767578, 28.510780334472656, 30.63355255126953, 32.756324768066406, 34.87909698486328, 37.001869201660156, 39.12464141845703, 41.247413635253906, 43.37018585205078, 45.492958068847656, 47.61573028564453, 49.738502502441406, 51.86127471923828, 53.984046936035156, 56.10681915283203, 58.229591369628906, 60.35236358642578, 62.475135803222656, 64.59790802001953, 66.7206802368164, 68.84345245361328, 70.96622467041016, 73.08899688720703, 75.2117691040039, 77.33454132080078, 79.45731353759766, 81.58008575439453, 83.7028579711914, 85.82563018798828, 87.94840240478516, 90.07117462158203, 92.1939468383789, 94.31671905517578, 96.43949127197266, 98.56226348876953, 100.6850357055664, 102.80780792236328, 104.93058013916016, 107.05335235595703]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 2.0, 4.0, 10.0, 8.0, 7.0, 10.0, 12.0, 28.0, 12.0, 26.0, 27.0, 40.0, 35.0, 36.0, 50.0, 46.0, 49.0, 63.0, 54.0, 64.0, 43.0, 47.0, 36.0, 42.0, 42.0, 30.0, 32.0, 30.0, 25.0, 17.0, 16.0, 18.0, 11.0, 8.0, 3.0, 5.0, 2.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-43.743247985839844, -42.58384704589844, -41.4244499206543, -40.26504898071289, -39.10565185546875, -37.946250915527344, -36.7868537902832, -35.6274528503418, -34.468055725097656, -33.30865478515625, -32.14925765991211, -30.989858627319336, -29.830459594726562, -28.67106056213379, -27.511661529541016, -26.35226058959961, -25.192861557006836, -24.033462524414062, -22.87406349182129, -21.714664459228516, -20.555265426635742, -19.39586639404297, -18.236465454101562, -17.077068328857422, -15.917668342590332, -14.758269309997559, -13.598870277404785, -12.439470291137695, -11.280071258544922, -10.120672225952148, -8.961273193359375, -7.801874160766602, -6.642473220825195, -5.483074188232422, -4.323675155639648, -3.164275646209717, -2.0048766136169434, -0.8454775810241699, 0.3139219284057617, 1.4733209609985352, 2.6327199935913086, 3.792119026184082, 4.9515180587768555, 6.110917568206787, 7.2703166007995605, 8.429716110229492, 9.589115142822266, 10.748514175415039, 11.907913208007812, 13.067312240600586, 14.22671127319336, 15.386110305786133, 16.545509338378906, 17.70490837097168, 18.864307403564453, 20.02370834350586, 21.18310546875, 22.342504501342773, 23.501903533935547, 24.66130256652832, 25.820701599121094, 26.980100631713867, 28.13949966430664, 29.298900604248047, 30.45829963684082]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 1.0, 0.0, 5.0, 6.0, 10.0, 15.0, 20.0, 28.0, 54.0, 118.0, 225.0, 567.0, 1343.0, 4465.0, 27012.0, 4142904.0, 12962.0, 2851.0, 974.0, 368.0, 177.0, 79.0, 25.0, 22.0, 17.0, 14.0, 5.0, 7.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6015625, -7.1871337890625, -6.772705078125, -6.3582763671875, -5.94384765625, -5.5294189453125, -5.114990234375, -4.7005615234375, -4.2861328125, -3.8717041015625, -3.457275390625, -3.0428466796875, -2.62841796875, -2.2139892578125, -1.799560546875, -1.3851318359375, -0.970703125, -0.5562744140625, -0.141845703125, 0.2725830078125, 0.68701171875, 1.1014404296875, 1.515869140625, 1.9302978515625, 2.3447265625, 2.7591552734375, 3.173583984375, 3.5880126953125, 4.00244140625, 4.4168701171875, 4.831298828125, 5.2457275390625, 5.66015625, 6.0745849609375, 6.489013671875, 6.9034423828125, 7.31787109375, 7.7322998046875, 8.146728515625, 8.5611572265625, 8.9755859375, 9.3900146484375, 9.804443359375, 10.2188720703125, 10.63330078125, 11.0477294921875, 11.462158203125, 11.8765869140625, 12.291015625, 12.7054443359375, 13.119873046875, 13.5343017578125, 13.94873046875, 14.3631591796875, 14.777587890625, 15.1920166015625, 15.6064453125, 16.0208740234375, 16.435302734375, 16.8497314453125, 17.26416015625, 17.6785888671875, 18.093017578125, 18.5074462890625, 18.921875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 6.0, 7.0, 5.0, 7.0, 12.0, 19.0, 24.0, 33.0, 29.0, 47.0, 56.0, 64.0, 53.0, 71.0, 74.0, 83.0, 61.0, 73.0, 56.0, 43.0, 44.0, 36.0, 30.0, 14.0, 15.0, 11.0, 9.0, 7.0, 5.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.740234375, -2.6728973388671875, -2.605560302734375, -2.5382232666015625, -2.47088623046875, -2.4035491943359375, -2.336212158203125, -2.2688751220703125, -2.2015380859375, -2.1342010498046875, -2.066864013671875, -1.9995269775390625, -1.93218994140625, -1.8648529052734375, -1.797515869140625, -1.7301788330078125, -1.662841796875, -1.5955047607421875, -1.528167724609375, -1.4608306884765625, -1.39349365234375, -1.3261566162109375, -1.258819580078125, -1.1914825439453125, -1.1241455078125, -1.0568084716796875, -0.989471435546875, -0.9221343994140625, -0.85479736328125, -0.7874603271484375, -0.720123291015625, -0.6527862548828125, -0.58544921875, -0.5181121826171875, -0.450775146484375, -0.3834381103515625, -0.31610107421875, -0.2487640380859375, -0.181427001953125, -0.1140899658203125, -0.0467529296875, 0.0205841064453125, 0.087921142578125, 0.1552581787109375, 0.22259521484375, 0.2899322509765625, 0.357269287109375, 0.4246063232421875, 0.491943359375, 0.5592803955078125, 0.626617431640625, 0.6939544677734375, 0.76129150390625, 0.8286285400390625, 0.895965576171875, 0.9633026123046875, 1.0306396484375, 1.0979766845703125, 1.165313720703125, 1.2326507568359375, 1.29998779296875, 1.3673248291015625, 1.434661865234375, 1.5019989013671875, 1.5693359375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 10.0, 11.0, 15.0, 17.0, 19.0, 24.0, 48.0, 58.0, 110.0, 126.0, 182.0, 291.0, 460.0, 712.0, 1323.0, 2727.0, 6254.0, 21058.0, 3990273.0, 145870.0, 14353.0, 5013.0, 2225.0, 1133.0, 697.0, 424.0, 285.0, 172.0, 123.0, 90.0, 60.0, 38.0, 20.0, 19.0, 13.0, 11.0, 10.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.20703125, -6.0181884765625, -5.829345703125, -5.6405029296875, -5.45166015625, -5.2628173828125, -5.073974609375, -4.8851318359375, -4.6962890625, -4.5074462890625, -4.318603515625, -4.1297607421875, -3.94091796875, -3.7520751953125, -3.563232421875, -3.3743896484375, -3.185546875, -2.9967041015625, -2.807861328125, -2.6190185546875, -2.43017578125, -2.2413330078125, -2.052490234375, -1.8636474609375, -1.6748046875, -1.4859619140625, -1.297119140625, -1.1082763671875, -0.91943359375, -0.7305908203125, -0.541748046875, -0.3529052734375, -0.1640625, 0.0247802734375, 0.213623046875, 0.4024658203125, 0.59130859375, 0.7801513671875, 0.968994140625, 1.1578369140625, 1.3466796875, 1.5355224609375, 1.724365234375, 1.9132080078125, 2.10205078125, 2.2908935546875, 2.479736328125, 2.6685791015625, 2.857421875, 3.0462646484375, 3.235107421875, 3.4239501953125, 3.61279296875, 3.8016357421875, 3.990478515625, 4.1793212890625, 4.3681640625, 4.5570068359375, 4.745849609375, 4.9346923828125, 5.12353515625, 5.3123779296875, 5.501220703125, 5.6900634765625, 5.87890625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 11.0, 14.0, 21.0, 37.0, 258.0, 3572.0, 77.0, 25.0, 14.0, 13.0, 10.0, 6.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.34375, -2.290679931640625, -2.23760986328125, -2.184539794921875, -2.1314697265625, -2.078399658203125, -2.02532958984375, -1.972259521484375, -1.919189453125, -1.866119384765625, -1.81304931640625, -1.759979248046875, -1.7069091796875, -1.653839111328125, -1.60076904296875, -1.547698974609375, -1.49462890625, -1.441558837890625, -1.38848876953125, -1.335418701171875, -1.2823486328125, -1.229278564453125, -1.17620849609375, -1.123138427734375, -1.070068359375, -1.016998291015625, -0.96392822265625, -0.910858154296875, -0.8577880859375, -0.804718017578125, -0.75164794921875, -0.698577880859375, -0.6455078125, -0.592437744140625, -0.53936767578125, -0.486297607421875, -0.4332275390625, -0.380157470703125, -0.32708740234375, -0.274017333984375, -0.220947265625, -0.167877197265625, -0.11480712890625, -0.061737060546875, -0.0086669921875, 0.044403076171875, 0.09747314453125, 0.150543212890625, 0.20361328125, 0.256683349609375, 0.30975341796875, 0.362823486328125, 0.4158935546875, 0.468963623046875, 0.52203369140625, 0.575103759765625, 0.628173828125, 0.681243896484375, 0.73431396484375, 0.787384033203125, 0.8404541015625, 0.893524169921875, 0.94659423828125, 0.999664306640625, 1.052734375]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 13.0, 17.0, 54.0, 99.0, 218.0, 293.0, 180.0, 79.0, 28.0, 8.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.700613975524902, -14.370037078857422, -14.039459228515625, -13.708882331848145, -13.378305435180664, -13.047727584838867, -12.717150688171387, -12.386573791503906, -12.05599594116211, -11.725419044494629, -11.394841194152832, -11.064264297485352, -10.733686447143555, -10.403109550476074, -10.072532653808594, -9.741954803466797, -9.411377906799316, -9.080801010131836, -8.750223159790039, -8.419646263122559, -8.089069366455078, -7.758491516113281, -7.427914619445801, -7.097337245941162, -6.766759872436523, -6.436182498931885, -6.105605125427246, -5.775028228759766, -5.444450855255127, -5.113873481750488, -4.783296585083008, -4.452719211578369, -4.122142791748047, -3.791565418243408, -3.4609882831573486, -3.130411148071289, -2.7998337745666504, -2.4692564010620117, -2.138679265975952, -1.8081021308898926, -1.477524757385254, -1.1469475030899048, -0.8163702487945557, -0.48579299449920654, -0.15521574020385742, 0.1753615140914917, 0.5059387683868408, 0.8365159034729004, 1.167093276977539, 1.4976705312728882, 1.8282477855682373, 2.158824920654297, 2.4894022941589355, 2.819979667663574, 3.150556802749634, 3.4811339378356934, 3.811711311340332, 4.142288684844971, 4.472866058349609, 4.80344295501709, 5.1340203285217285, 5.464597702026367, 5.795174598693848, 6.125751972198486, 6.456329345703125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 3.0, 6.0, 11.0, 10.0, 12.0, 18.0, 17.0, 25.0, 19.0, 22.0, 27.0, 31.0, 37.0, 43.0, 37.0, 44.0, 46.0, 35.0, 32.0, 54.0, 45.0, 44.0, 38.0, 37.0, 53.0, 47.0, 38.0, 29.0, 24.0, 18.0, 22.0, 12.0, 11.0, 9.0, 8.0, 11.0, 4.0, 10.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-3.0633294582366943, -2.976255416870117, -2.88918137550354, -2.802107334136963, -2.7150330543518066, -2.6279590129852295, -2.5408849716186523, -2.453810930252075, -2.366736888885498, -2.279662847518921, -2.1925888061523438, -2.1055145263671875, -2.0184404850006104, -1.9313664436340332, -1.844292402267456, -1.757218360900879, -1.6701440811157227, -1.5830700397491455, -1.4959958791732788, -1.4089218378067017, -1.321847677230835, -1.2347736358642578, -1.1476995944976807, -1.0606255531311035, -0.9735513925552368, -0.8864772915840149, -0.799403190612793, -0.7123291492462158, -0.6252550482749939, -0.538180947303772, -0.4511069059371948, -0.3640328049659729, -0.2769589424133301, -0.18988485634326935, -0.10281077027320862, -0.015736699104309082, 0.07133740186691284, 0.15841150283813477, 0.24548554420471191, 0.33255964517593384, 0.41963374614715576, 0.5067078471183777, 0.5937819480895996, 0.6808559894561768, 0.7679300904273987, 0.8550041913986206, 0.9420782327651978, 1.0291523933410645, 1.1162264347076416, 1.2033004760742188, 1.2903746366500854, 1.3774486780166626, 1.4645228385925293, 1.5515968799591064, 1.6386709213256836, 1.7257449626922607, 1.8128191232681274, 1.8998931646347046, 1.9869673252105713, 2.0740413665771484, 2.1611154079437256, 2.2481894493103027, 2.335263729095459, 2.422337770462036, 2.5094118118286133]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 8.0, 9.0, 16.0, 9.0, 21.0, 29.0, 45.0, 79.0, 88.0, 188.0, 356.0, 693.0, 1348.0, 2841.0, 6413.0, 15709.0, 43207.0, 134877.0, 396947.0, 301405.0, 92377.0, 30781.0, 11803.0, 4758.0, 2175.0, 1080.0, 561.0, 300.0, 159.0, 87.0, 49.0, 51.0, 31.0, 18.0, 13.0, 9.0, 7.0, 7.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.986328125, -2.882781982421875, -2.77923583984375, -2.675689697265625, -2.5721435546875, -2.468597412109375, -2.36505126953125, -2.261505126953125, -2.157958984375, -2.054412841796875, -1.95086669921875, -1.847320556640625, -1.7437744140625, -1.640228271484375, -1.53668212890625, -1.433135986328125, -1.32958984375, -1.226043701171875, -1.12249755859375, -1.018951416015625, -0.9154052734375, -0.811859130859375, -0.70831298828125, -0.604766845703125, -0.501220703125, -0.397674560546875, -0.29412841796875, -0.190582275390625, -0.0870361328125, 0.016510009765625, 0.12005615234375, 0.223602294921875, 0.3271484375, 0.430694580078125, 0.53424072265625, 0.637786865234375, 0.7413330078125, 0.844879150390625, 0.94842529296875, 1.051971435546875, 1.155517578125, 1.259063720703125, 1.36260986328125, 1.466156005859375, 1.5697021484375, 1.673248291015625, 1.77679443359375, 1.880340576171875, 1.98388671875, 2.087432861328125, 2.19097900390625, 2.294525146484375, 2.3980712890625, 2.501617431640625, 2.60516357421875, 2.708709716796875, 2.812255859375, 2.915802001953125, 3.01934814453125, 3.122894287109375, 3.2264404296875, 3.329986572265625, 3.43353271484375, 3.537078857421875, 3.640625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 1.0, 2.0, 4.0, 6.0, 6.0, 11.0, 15.0, 18.0, 22.0, 35.0, 35.0, 48.0, 45.0, 39.0, 42.0, 50.0, 65.0, 56.0, 76.0, 70.0, 61.0, 50.0, 45.0, 40.0, 40.0, 27.0, 18.0, 17.0, 11.0, 11.0, 8.0, 8.0, 8.0, 5.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-2.572265625, -2.510101318359375, -2.44793701171875, -2.385772705078125, -2.3236083984375, -2.261444091796875, -2.19927978515625, -2.137115478515625, -2.074951171875, -2.012786865234375, -1.95062255859375, -1.888458251953125, -1.8262939453125, -1.764129638671875, -1.70196533203125, -1.639801025390625, -1.57763671875, -1.515472412109375, -1.45330810546875, -1.391143798828125, -1.3289794921875, -1.266815185546875, -1.20465087890625, -1.142486572265625, -1.080322265625, -1.018157958984375, -0.95599365234375, -0.893829345703125, -0.8316650390625, -0.769500732421875, -0.70733642578125, -0.645172119140625, -0.5830078125, -0.520843505859375, -0.45867919921875, -0.396514892578125, -0.3343505859375, -0.272186279296875, -0.21002197265625, -0.147857666015625, -0.085693359375, -0.023529052734375, 0.03863525390625, 0.100799560546875, 0.1629638671875, 0.225128173828125, 0.28729248046875, 0.349456787109375, 0.41162109375, 0.473785400390625, 0.53594970703125, 0.598114013671875, 0.6602783203125, 0.722442626953125, 0.78460693359375, 0.846771240234375, 0.908935546875, 0.971099853515625, 1.03326416015625, 1.095428466796875, 1.1575927734375, 1.219757080078125, 1.28192138671875, 1.344085693359375, 1.40625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 10.0, 8.0, 17.0, 50.0, 75.0, 169.0, 323.0, 768.0, 2269.0, 8826.0, 67857.0, 824031.0, 126612.0, 12906.0, 2964.0, 925.0, 374.0, 143.0, 80.0, 41.0, 23.0, 20.0, 14.0, 13.0, 8.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0390625, -8.77789306640625, -8.5167236328125, -8.25555419921875, -7.994384765625, -7.73321533203125, -7.4720458984375, -7.21087646484375, -6.94970703125, -6.68853759765625, -6.4273681640625, -6.16619873046875, -5.905029296875, -5.64385986328125, -5.3826904296875, -5.12152099609375, -4.8603515625, -4.59918212890625, -4.3380126953125, -4.07684326171875, -3.815673828125, -3.55450439453125, -3.2933349609375, -3.03216552734375, -2.77099609375, -2.50982666015625, -2.2486572265625, -1.98748779296875, -1.726318359375, -1.46514892578125, -1.2039794921875, -0.94281005859375, -0.681640625, -0.42047119140625, -0.1593017578125, 0.10186767578125, 0.363037109375, 0.62420654296875, 0.8853759765625, 1.14654541015625, 1.40771484375, 1.66888427734375, 1.9300537109375, 2.19122314453125, 2.452392578125, 2.71356201171875, 2.9747314453125, 3.23590087890625, 3.4970703125, 3.75823974609375, 4.0194091796875, 4.28057861328125, 4.541748046875, 4.80291748046875, 5.0640869140625, 5.32525634765625, 5.58642578125, 5.84759521484375, 6.1087646484375, 6.36993408203125, 6.631103515625, 6.89227294921875, 7.1534423828125, 7.41461181640625, 7.67578125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 4.0, 3.0, 1.0, 14.0, 10.0, 11.0, 20.0, 22.0, 24.0, 16.0, 29.0, 31.0, 31.0, 56.0, 37.0, 55.0, 44.0, 47.0, 55.0, 51.0, 43.0, 51.0, 51.0, 45.0, 43.0, 37.0, 21.0, 32.0, 20.0, 13.0, 14.0, 12.0, 15.0, 8.0, 9.0, 3.0, 4.0, 1.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0], "bins": [-8.09375, -7.854736328125, -7.61572265625, -7.376708984375, -7.1376953125, -6.898681640625, -6.65966796875, -6.420654296875, -6.181640625, -5.942626953125, -5.70361328125, -5.464599609375, -5.2255859375, -4.986572265625, -4.74755859375, -4.508544921875, -4.26953125, -4.030517578125, -3.79150390625, -3.552490234375, -3.3134765625, -3.074462890625, -2.83544921875, -2.596435546875, -2.357421875, -2.118408203125, -1.87939453125, -1.640380859375, -1.4013671875, -1.162353515625, -0.92333984375, -0.684326171875, -0.4453125, -0.206298828125, 0.03271484375, 0.271728515625, 0.5107421875, 0.749755859375, 0.98876953125, 1.227783203125, 1.466796875, 1.705810546875, 1.94482421875, 2.183837890625, 2.4228515625, 2.661865234375, 2.90087890625, 3.139892578125, 3.37890625, 3.617919921875, 3.85693359375, 4.095947265625, 4.3349609375, 4.573974609375, 4.81298828125, 5.052001953125, 5.291015625, 5.530029296875, 5.76904296875, 6.008056640625, 6.2470703125, 6.486083984375, 6.72509765625, 6.964111328125, 7.203125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 6.0, 9.0, 16.0, 12.0, 19.0, 32.0, 76.0, 110.0, 223.0, 438.0, 1204.0, 3566.0, 16731.0, 325710.0, 669798.0, 23471.0, 4580.0, 1412.0, 549.0, 242.0, 121.0, 78.0, 63.0, 29.0, 22.0, 11.0, 6.0, 3.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.046875, -3.912353515625, -3.77783203125, -3.643310546875, -3.5087890625, -3.374267578125, -3.23974609375, -3.105224609375, -2.970703125, -2.836181640625, -2.70166015625, -2.567138671875, -2.4326171875, -2.298095703125, -2.16357421875, -2.029052734375, -1.89453125, -1.760009765625, -1.62548828125, -1.490966796875, -1.3564453125, -1.221923828125, -1.08740234375, -0.952880859375, -0.818359375, -0.683837890625, -0.54931640625, -0.414794921875, -0.2802734375, -0.145751953125, -0.01123046875, 0.123291015625, 0.2578125, 0.392333984375, 0.52685546875, 0.661376953125, 0.7958984375, 0.930419921875, 1.06494140625, 1.199462890625, 1.333984375, 1.468505859375, 1.60302734375, 1.737548828125, 1.8720703125, 2.006591796875, 2.14111328125, 2.275634765625, 2.41015625, 2.544677734375, 2.67919921875, 2.813720703125, 2.9482421875, 3.082763671875, 3.21728515625, 3.351806640625, 3.486328125, 3.620849609375, 3.75537109375, 3.889892578125, 4.0244140625, 4.158935546875, 4.29345703125, 4.427978515625, 4.5625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 3.0, 4.0, 14.0, 23.0, 39.0, 73.0, 165.0, 316.0, 199.0, 80.0, 39.0, 21.0, 15.0, 8.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011072158813476562, -0.0010760799050331116, -0.001044943928718567, -0.0010138079524040222, -0.0009826719760894775, -0.0009515359997749329, -0.0009204000234603882, -0.0008892640471458435, -0.0008581280708312988, -0.0008269920945167542, -0.0007958561182022095, -0.0007647201418876648, -0.0007335841655731201, -0.0007024481892585754, -0.0006713122129440308, -0.0006401762366294861, -0.0006090402603149414, -0.0005779042840003967, -0.000546768307685852, -0.0005156323313713074, -0.0004844963550567627, -0.000453360378742218, -0.00042222440242767334, -0.00039108842611312866, -0.000359952449798584, -0.0003288164734840393, -0.00029768049716949463, -0.00026654452085494995, -0.00023540854454040527, -0.0002042725682258606, -0.00017313659191131592, -0.00014200061559677124, -0.00011086463928222656, -7.972866296768188e-05, -4.859268665313721e-05, -1.745671033859253e-05, 1.3679265975952148e-05, 4.4815242290496826e-05, 7.59512186050415e-05, 0.00010708719491958618, 0.00013822317123413086, 0.00016935914754867554, 0.00020049512386322021, 0.0002316311001777649, 0.00026276707649230957, 0.00029390305280685425, 0.0003250390291213989, 0.0003561750054359436, 0.0003873109817504883, 0.00041844695806503296, 0.00044958293437957764, 0.0004807189106941223, 0.000511854887008667, 0.0005429908633232117, 0.0005741268396377563, 0.000605262815952301, 0.0006363987922668457, 0.0006675347685813904, 0.0006986707448959351, 0.0007298067212104797, 0.0007609426975250244, 0.0007920786738395691, 0.0008232146501541138, 0.0008543506264686584, 0.0008854866027832031]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 8.0, 6.0, 28.0, 44.0, 57.0, 114.0, 249.0, 672.0, 2001.0, 10711.0, 280720.0, 731914.0, 17784.0, 2872.0, 784.0, 291.0, 121.0, 66.0, 41.0, 24.0, 11.0, 11.0, 2.0, 5.0, 3.0, 2.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.486328125, -3.335479736328125, -3.18463134765625, -3.033782958984375, -2.8829345703125, -2.732086181640625, -2.58123779296875, -2.430389404296875, -2.279541015625, -2.128692626953125, -1.97784423828125, -1.826995849609375, -1.6761474609375, -1.525299072265625, -1.37445068359375, -1.223602294921875, -1.07275390625, -0.921905517578125, -0.77105712890625, -0.620208740234375, -0.4693603515625, -0.318511962890625, -0.16766357421875, -0.016815185546875, 0.134033203125, 0.284881591796875, 0.43572998046875, 0.586578369140625, 0.7374267578125, 0.888275146484375, 1.03912353515625, 1.189971923828125, 1.3408203125, 1.491668701171875, 1.64251708984375, 1.793365478515625, 1.9442138671875, 2.095062255859375, 2.24591064453125, 2.396759033203125, 2.547607421875, 2.698455810546875, 2.84930419921875, 3.000152587890625, 3.1510009765625, 3.301849365234375, 3.45269775390625, 3.603546142578125, 3.75439453125, 3.905242919921875, 4.05609130859375, 4.206939697265625, 4.3577880859375, 4.508636474609375, 4.65948486328125, 4.810333251953125, 4.961181640625, 5.112030029296875, 5.26287841796875, 5.413726806640625, 5.5645751953125, 5.715423583984375, 5.86627197265625, 6.017120361328125, 6.16796875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 5.0, 6.0, 4.0, 9.0, 9.0, 17.0, 16.0, 22.0, 41.0, 53.0, 90.0, 120.0, 152.0, 128.0, 123.0, 54.0, 45.0, 25.0, 19.0, 24.0, 14.0, 9.0, 5.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.79296875, -3.680023193359375, -3.56707763671875, -3.454132080078125, -3.3411865234375, -3.228240966796875, -3.11529541015625, -3.002349853515625, -2.889404296875, -2.776458740234375, -2.66351318359375, -2.550567626953125, -2.4376220703125, -2.324676513671875, -2.21173095703125, -2.098785400390625, -1.98583984375, -1.872894287109375, -1.75994873046875, -1.647003173828125, -1.5340576171875, -1.421112060546875, -1.30816650390625, -1.195220947265625, -1.082275390625, -0.969329833984375, -0.85638427734375, -0.743438720703125, -0.6304931640625, -0.517547607421875, -0.40460205078125, -0.291656494140625, -0.1787109375, -0.065765380859375, 0.04718017578125, 0.160125732421875, 0.2730712890625, 0.386016845703125, 0.49896240234375, 0.611907958984375, 0.724853515625, 0.837799072265625, 0.95074462890625, 1.063690185546875, 1.1766357421875, 1.289581298828125, 1.40252685546875, 1.515472412109375, 1.62841796875, 1.741363525390625, 1.85430908203125, 1.967254638671875, 2.0802001953125, 2.193145751953125, 2.30609130859375, 2.419036865234375, 2.531982421875, 2.644927978515625, 2.75787353515625, 2.870819091796875, 2.9837646484375, 3.096710205078125, 3.20965576171875, 3.322601318359375, 3.435546875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 4.0, 3.0, 10.0, 17.0, 44.0, 81.0, 177.0, 279.0, 204.0, 105.0, 47.0, 15.0, 13.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.69265747070312, -70.8166732788086, -67.94068908691406, -65.06470489501953, -62.188716888427734, -59.3127326965332, -56.436744689941406, -53.560760498046875, -50.684776306152344, -47.80879211425781, -44.93280792236328, -42.056819915771484, -39.18083572387695, -36.30485153198242, -33.428863525390625, -30.552879333496094, -27.676895141601562, -24.80091094970703, -21.924924850463867, -19.048938751220703, -16.172954559326172, -13.296969413757324, -10.420984268188477, -7.5449981689453125, -4.669013977050781, -1.7930288314819336, 1.082956314086914, 3.9589414596557617, 6.834926605224609, 9.710911750793457, 12.586896896362305, 15.462882995605469, 18.33885955810547, 21.21484375, 24.090829849243164, 26.966815948486328, 29.84280014038086, 32.71878433227539, 35.59477233886719, 38.47075653076172, 41.34674072265625, 44.22272491455078, 47.09870910644531, 49.97469711303711, 52.85068130493164, 55.72666549682617, 58.60265350341797, 61.4786376953125, 64.35462188720703, 67.23060607910156, 70.1065902709961, 72.98257446289062, 75.85856628417969, 78.73455047607422, 81.61053466796875, 84.48651885986328, 87.36250305175781, 90.23848724365234, 93.11447143554688, 95.9904556274414, 98.86643981933594, 101.742431640625, 104.61841583251953, 107.49440002441406, 110.3703842163086]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 7.0, 7.0, 12.0, 11.0, 13.0, 11.0, 17.0, 14.0, 19.0, 21.0, 29.0, 24.0, 39.0, 30.0, 41.0, 42.0, 44.0, 46.0, 43.0, 46.0, 43.0, 42.0, 42.0, 41.0, 32.0, 29.0, 28.0, 30.0, 26.0, 22.0, 28.0, 21.0, 21.0, 19.0, 9.0, 12.0, 8.0, 7.0, 6.0, 9.0, 4.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.289255142211914, -23.3831844329834, -22.477113723754883, -21.571044921875, -20.664974212646484, -19.75890350341797, -18.852832794189453, -17.946762084960938, -17.040691375732422, -16.134620666503906, -15.228550910949707, -14.322480201721191, -13.416410446166992, -12.510339736938477, -11.604269027709961, -10.698198318481445, -9.792129516601562, -8.886058807373047, -7.979989051818848, -7.073918342590332, -6.167848110198975, -5.261777877807617, -4.355707168579102, -3.449636936187744, -2.5435667037963867, -1.6374963521957397, -0.7314260005950928, 0.17464447021484375, 1.0807147026062012, 1.9867849349975586, 2.892855644226074, 3.7989258766174316, 4.704994201660156, 5.611064434051514, 6.517134666442871, 7.423205375671387, 8.329275131225586, 9.235345840454102, 10.141416549682617, 11.047487258911133, 11.953557014465332, 12.859627723693848, 13.765697479248047, 14.671768188476562, 15.577838897705078, 16.483909606933594, 17.38998031616211, 18.296049118041992, 19.202119827270508, 20.108190536499023, 21.01426124572754, 21.920330047607422, 22.826400756835938, 23.732471466064453, 24.63854217529297, 25.544612884521484, 26.45068359375, 27.356754302978516, 28.26282501220703, 29.168895721435547, 30.07496452331543, 30.981035232543945, 31.88710594177246, 32.793174743652344, 33.69924545288086]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 8.0, 4.0, 1.0, 4.0, 6.0, 6.0, 13.0, 23.0, 15.0, 25.0, 47.0, 57.0, 88.0, 139.0, 207.0, 369.0, 753.0, 1840.0, 8711.0, 4161456.0, 16202.0, 2328.0, 813.0, 430.0, 247.0, 143.0, 88.0, 55.0, 40.0, 40.0, 25.0, 30.0, 19.0, 11.0, 6.0, 8.0, 6.0, 5.0, 3.0, 2.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-14.7265625, -14.3131103515625, -13.899658203125, -13.4862060546875, -13.07275390625, -12.6593017578125, -12.245849609375, -11.8323974609375, -11.4189453125, -11.0054931640625, -10.592041015625, -10.1785888671875, -9.76513671875, -9.3516845703125, -8.938232421875, -8.5247802734375, -8.111328125, -7.6978759765625, -7.284423828125, -6.8709716796875, -6.45751953125, -6.0440673828125, -5.630615234375, -5.2171630859375, -4.8037109375, -4.3902587890625, -3.976806640625, -3.5633544921875, -3.14990234375, -2.7364501953125, -2.322998046875, -1.9095458984375, -1.49609375, -1.0826416015625, -0.669189453125, -0.2557373046875, 0.15771484375, 0.5711669921875, 0.984619140625, 1.3980712890625, 1.8115234375, 2.2249755859375, 2.638427734375, 3.0518798828125, 3.46533203125, 3.8787841796875, 4.292236328125, 4.7056884765625, 5.119140625, 5.5325927734375, 5.946044921875, 6.3594970703125, 6.77294921875, 7.1864013671875, 7.599853515625, 8.0133056640625, 8.4267578125, 8.8402099609375, 9.253662109375, 9.6671142578125, 10.08056640625, 10.4940185546875, 10.907470703125, 11.3209228515625, 11.734375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 7.0, 5.0, 9.0, 15.0, 20.0, 33.0, 48.0, 38.0, 55.0, 58.0, 70.0, 88.0, 77.0, 88.0, 81.0, 74.0, 56.0, 58.0, 25.0, 28.0, 18.0, 13.0, 12.0, 13.0, 3.0, 6.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.98828125, -2.893798828125, -2.79931640625, -2.704833984375, -2.6103515625, -2.515869140625, -2.42138671875, -2.326904296875, -2.232421875, -2.137939453125, -2.04345703125, -1.948974609375, -1.8544921875, -1.760009765625, -1.66552734375, -1.571044921875, -1.4765625, -1.382080078125, -1.28759765625, -1.193115234375, -1.0986328125, -1.004150390625, -0.90966796875, -0.815185546875, -0.720703125, -0.626220703125, -0.53173828125, -0.437255859375, -0.3427734375, -0.248291015625, -0.15380859375, -0.059326171875, 0.03515625, 0.129638671875, 0.22412109375, 0.318603515625, 0.4130859375, 0.507568359375, 0.60205078125, 0.696533203125, 0.791015625, 0.885498046875, 0.97998046875, 1.074462890625, 1.1689453125, 1.263427734375, 1.35791015625, 1.452392578125, 1.546875, 1.641357421875, 1.73583984375, 1.830322265625, 1.9248046875, 2.019287109375, 2.11376953125, 2.208251953125, 2.302734375, 2.397216796875, 2.49169921875, 2.586181640625, 2.6806640625, 2.775146484375, 2.86962890625, 2.964111328125, 3.05859375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 5.0, 3.0, 5.0, 10.0, 6.0, 8.0, 10.0, 30.0, 26.0, 39.0, 33.0, 60.0, 78.0, 124.0, 185.0, 461.0, 1213.0, 4890.0, 4130768.0, 50927.0, 3501.0, 957.0, 348.0, 186.0, 100.0, 82.0, 58.0, 41.0, 29.0, 23.0, 17.0, 16.0, 11.0, 3.0, 11.0, 8.0, 3.0, 4.0, 4.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.734375, -16.9921875, -16.25, -15.5078125, -14.765625, -14.0234375, -13.28125, -12.5390625, -11.796875, -11.0546875, -10.3125, -9.5703125, -8.828125, -8.0859375, -7.34375, -6.6015625, -5.859375, -5.1171875, -4.375, -3.6328125, -2.890625, -2.1484375, -1.40625, -0.6640625, 0.078125, 0.8203125, 1.5625, 2.3046875, 3.046875, 3.7890625, 4.53125, 5.2734375, 6.015625, 6.7578125, 7.5, 8.2421875, 8.984375, 9.7265625, 10.46875, 11.2109375, 11.953125, 12.6953125, 13.4375, 14.1796875, 14.921875, 15.6640625, 16.40625, 17.1484375, 17.890625, 18.6328125, 19.375, 20.1171875, 20.859375, 21.6015625, 22.34375, 23.0859375, 23.828125, 24.5703125, 25.3125, 26.0546875, 26.796875, 27.5390625, 28.28125, 29.0234375, 29.765625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 16.0, 24.0, 3955.0, 53.0, 17.0, 4.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8505859375, -1.6746978759765625, -1.498809814453125, -1.3229217529296875, -1.14703369140625, -0.9711456298828125, -0.795257568359375, -0.6193695068359375, -0.4434814453125, -0.2675933837890625, -0.091705322265625, 0.0841827392578125, 0.26007080078125, 0.4359588623046875, 0.611846923828125, 0.7877349853515625, 0.963623046875, 1.1395111083984375, 1.315399169921875, 1.4912872314453125, 1.66717529296875, 1.8430633544921875, 2.018951416015625, 2.1948394775390625, 2.3707275390625, 2.5466156005859375, 2.722503662109375, 2.8983917236328125, 3.07427978515625, 3.2501678466796875, 3.426055908203125, 3.6019439697265625, 3.77783203125, 3.9537200927734375, 4.129608154296875, 4.3054962158203125, 4.48138427734375, 4.6572723388671875, 4.833160400390625, 5.0090484619140625, 5.1849365234375, 5.3608245849609375, 5.536712646484375, 5.7126007080078125, 5.88848876953125, 6.0643768310546875, 6.240264892578125, 6.4161529541015625, 6.592041015625, 6.7679290771484375, 6.943817138671875, 7.1197052001953125, 7.29559326171875, 7.4714813232421875, 7.647369384765625, 7.8232574462890625, 7.9991455078125, 8.175033569335938, 8.350921630859375, 8.526809692382812, 8.70269775390625, 8.878585815429688, 9.054473876953125, 9.230361938476562, 9.40625]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 14.0, 35.0, 47.0, 128.0, 185.0, 177.0, 171.0, 89.0, 44.0, 31.0, 23.0, 15.0, 12.0, 8.0, 3.0, 6.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.371984481811523, -11.025482177734375, -10.678979873657227, -10.332477569580078, -9.98597526550293, -9.639473915100098, -9.29297161102295, -8.9464693069458, -8.599967002868652, -8.253464698791504, -7.9069623947143555, -7.560460567474365, -7.213958263397217, -6.867455959320068, -6.520954132080078, -6.17445182800293, -5.827949523925781, -5.481447219848633, -5.134944915771484, -4.788443088531494, -4.441940784454346, -4.095438480377197, -3.748936414718628, -3.4024343490600586, -3.05593204498291, -2.7094297409057617, -2.3629276752471924, -2.016425609588623, -1.6699233055114746, -1.3234211206436157, -0.9769189357757568, -0.6304168701171875, -0.28391361236572266, 0.06258857250213623, 0.4090907573699951, 0.755592942237854, 1.102095127105713, 1.4485973119735718, 1.7950994968414307, 2.1416015625, 2.4881038665771484, 2.834606170654297, 3.181108236312866, 3.5276103019714355, 3.874112606048584, 4.220614910125732, 4.567116737365723, 4.913619041442871, 5.2601213455200195, 5.606623649597168, 5.953125953674316, 6.299627780914307, 6.646130084991455, 6.9926323890686035, 7.339134216308594, 7.685636520385742, 8.03213882446289, 8.378641128540039, 8.725143432617188, 9.071645736694336, 9.418148040771484, 9.764649391174316, 10.111151695251465, 10.457653999328613, 10.804156303405762]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 5.0, 10.0, 15.0, 20.0, 12.0, 20.0, 17.0, 21.0, 24.0, 30.0, 27.0, 22.0, 32.0, 37.0, 39.0, 34.0, 37.0, 40.0, 31.0, 39.0, 30.0, 40.0, 47.0, 31.0, 33.0, 29.0, 27.0, 22.0, 31.0, 20.0, 16.0, 21.0, 23.0, 22.0, 16.0, 12.0, 17.0, 13.0, 3.0, 8.0, 10.0, 5.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.399012565612793, -5.236536502838135, -5.074060440063477, -4.911584854125977, -4.749108791351318, -4.58663272857666, -4.42415714263916, -4.261681079864502, -4.099205017089844, -3.9367289543151855, -3.7742531299591064, -3.6117773056030273, -3.449301242828369, -3.286825180053711, -3.124349355697632, -2.9618735313415527, -2.7993974685668945, -2.6369214057922363, -2.4744455814361572, -2.311969757080078, -2.14949369430542, -1.9870177507400513, -1.8245418071746826, -1.662065863609314, -1.4995899200439453, -1.3371139764785767, -1.174638032913208, -1.0121620893478394, -0.8496861457824707, -0.687210202217102, -0.5247342586517334, -0.36225831508636475, -0.1997823715209961, -0.03730642795562744, 0.1251695156097412, 0.28764545917510986, 0.4501214027404785, 0.6125973463058472, 0.7750732898712158, 0.9375492334365845, 1.1000251770019531, 1.2625011205673218, 1.4249770641326904, 1.587453007698059, 1.7499289512634277, 1.9124048948287964, 2.074880838394165, 2.237356662750244, 2.3998327255249023, 2.5623087882995605, 2.7247846126556396, 2.8872604370117188, 3.049736499786377, 3.212212562561035, 3.3746883869171143, 3.5371642112731934, 3.6996402740478516, 3.8621163368225098, 4.024592399597168, 4.187067985534668, 4.349544048309326, 4.512020111083984, 4.674495697021484, 4.836971759796143, 4.999447822570801]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 7.0, 13.0, 15.0, 17.0, 27.0, 36.0, 56.0, 81.0, 100.0, 196.0, 301.0, 493.0, 913.0, 1686.0, 3244.0, 6839.0, 16391.0, 46871.0, 161007.0, 485326.0, 225295.0, 61523.0, 21090.0, 8569.0, 3894.0, 1898.0, 1059.0, 620.0, 362.0, 228.0, 147.0, 96.0, 50.0, 36.0, 25.0, 15.0, 11.0, 6.0, 3.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.5703125, -4.4420166015625, -4.313720703125, -4.1854248046875, -4.05712890625, -3.9288330078125, -3.800537109375, -3.6722412109375, -3.5439453125, -3.4156494140625, -3.287353515625, -3.1590576171875, -3.03076171875, -2.9024658203125, -2.774169921875, -2.6458740234375, -2.517578125, -2.3892822265625, -2.260986328125, -2.1326904296875, -2.00439453125, -1.8760986328125, -1.747802734375, -1.6195068359375, -1.4912109375, -1.3629150390625, -1.234619140625, -1.1063232421875, -0.97802734375, -0.8497314453125, -0.721435546875, -0.5931396484375, -0.46484375, -0.3365478515625, -0.208251953125, -0.0799560546875, 0.04833984375, 0.1766357421875, 0.304931640625, 0.4332275390625, 0.5615234375, 0.6898193359375, 0.818115234375, 0.9464111328125, 1.07470703125, 1.2030029296875, 1.331298828125, 1.4595947265625, 1.587890625, 1.7161865234375, 1.844482421875, 1.9727783203125, 2.10107421875, 2.2293701171875, 2.357666015625, 2.4859619140625, 2.6142578125, 2.7425537109375, 2.870849609375, 2.9991455078125, 3.12744140625, 3.2557373046875, 3.384033203125, 3.5123291015625, 3.640625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 0.0, 4.0, 8.0, 8.0, 16.0, 8.0, 17.0, 21.0, 18.0, 26.0, 33.0, 38.0, 40.0, 56.0, 54.0, 51.0, 58.0, 63.0, 65.0, 54.0, 56.0, 41.0, 42.0, 38.0, 33.0, 35.0, 18.0, 24.0, 17.0, 13.0, 16.0, 8.0, 5.0, 3.0, 3.0, 3.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.400390625, -2.322357177734375, -2.24432373046875, -2.166290283203125, -2.0882568359375, -2.010223388671875, -1.93218994140625, -1.854156494140625, -1.776123046875, -1.698089599609375, -1.62005615234375, -1.542022705078125, -1.4639892578125, -1.385955810546875, -1.30792236328125, -1.229888916015625, -1.15185546875, -1.073822021484375, -0.99578857421875, -0.917755126953125, -0.8397216796875, -0.761688232421875, -0.68365478515625, -0.605621337890625, -0.527587890625, -0.449554443359375, -0.37152099609375, -0.293487548828125, -0.2154541015625, -0.137420654296875, -0.05938720703125, 0.018646240234375, 0.0966796875, 0.174713134765625, 0.25274658203125, 0.330780029296875, 0.4088134765625, 0.486846923828125, 0.56488037109375, 0.642913818359375, 0.720947265625, 0.798980712890625, 0.87701416015625, 0.955047607421875, 1.0330810546875, 1.111114501953125, 1.18914794921875, 1.267181396484375, 1.34521484375, 1.423248291015625, 1.50128173828125, 1.579315185546875, 1.6573486328125, 1.735382080078125, 1.81341552734375, 1.891448974609375, 1.969482421875, 2.047515869140625, 2.12554931640625, 2.203582763671875, 2.2816162109375, 2.359649658203125, 2.43768310546875, 2.515716552734375, 2.59375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 17.0, 9.0, 16.0, 27.0, 33.0, 68.0, 100.0, 178.0, 400.0, 1091.0, 3804.0, 18808.0, 296310.0, 688640.0, 31411.0, 5098.0, 1486.0, 516.0, 226.0, 107.0, 64.0, 50.0, 24.0, 19.0, 8.0, 9.0, 7.0, 5.0, 6.0, 4.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-14.5859375, -14.1929931640625, -13.800048828125, -13.4071044921875, -13.01416015625, -12.6212158203125, -12.228271484375, -11.8353271484375, -11.4423828125, -11.0494384765625, -10.656494140625, -10.2635498046875, -9.87060546875, -9.4776611328125, -9.084716796875, -8.6917724609375, -8.298828125, -7.9058837890625, -7.512939453125, -7.1199951171875, -6.72705078125, -6.3341064453125, -5.941162109375, -5.5482177734375, -5.1552734375, -4.7623291015625, -4.369384765625, -3.9764404296875, -3.58349609375, -3.1905517578125, -2.797607421875, -2.4046630859375, -2.01171875, -1.6187744140625, -1.225830078125, -0.8328857421875, -0.43994140625, -0.0469970703125, 0.345947265625, 0.7388916015625, 1.1318359375, 1.5247802734375, 1.917724609375, 2.3106689453125, 2.70361328125, 3.0965576171875, 3.489501953125, 3.8824462890625, 4.275390625, 4.6683349609375, 5.061279296875, 5.4542236328125, 5.84716796875, 6.2401123046875, 6.633056640625, 7.0260009765625, 7.4189453125, 7.8118896484375, 8.204833984375, 8.5977783203125, 8.99072265625, 9.3836669921875, 9.776611328125, 10.1695556640625, 10.5625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 6.0, 10.0, 12.0, 21.0, 28.0, 21.0, 31.0, 39.0, 31.0, 62.0, 61.0, 50.0, 69.0, 66.0, 53.0, 67.0, 64.0, 52.0, 49.0, 41.0, 37.0, 25.0, 18.0, 20.0, 13.0, 13.0, 11.0, 5.0, 5.0, 5.0, 1.0, 3.0, 5.0, 4.0, 1.0, 3.0, 4.0], "bins": [-19.140625, -18.6708984375, -18.201171875, -17.7314453125, -17.26171875, -16.7919921875, -16.322265625, -15.8525390625, -15.3828125, -14.9130859375, -14.443359375, -13.9736328125, -13.50390625, -13.0341796875, -12.564453125, -12.0947265625, -11.625, -11.1552734375, -10.685546875, -10.2158203125, -9.74609375, -9.2763671875, -8.806640625, -8.3369140625, -7.8671875, -7.3974609375, -6.927734375, -6.4580078125, -5.98828125, -5.5185546875, -5.048828125, -4.5791015625, -4.109375, -3.6396484375, -3.169921875, -2.7001953125, -2.23046875, -1.7607421875, -1.291015625, -0.8212890625, -0.3515625, 0.1181640625, 0.587890625, 1.0576171875, 1.52734375, 1.9970703125, 2.466796875, 2.9365234375, 3.40625, 3.8759765625, 4.345703125, 4.8154296875, 5.28515625, 5.7548828125, 6.224609375, 6.6943359375, 7.1640625, 7.6337890625, 8.103515625, 8.5732421875, 9.04296875, 9.5126953125, 9.982421875, 10.4521484375, 10.921875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 10.0, 6.0, 8.0, 13.0, 24.0, 32.0, 72.0, 121.0, 204.0, 382.0, 906.0, 2511.0, 11368.0, 218475.0, 784587.0, 23569.0, 3980.0, 1182.0, 520.0, 235.0, 136.0, 80.0, 48.0, 24.0, 9.0, 15.0, 8.0, 7.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.83203125, -5.66619873046875, -5.5003662109375, -5.33453369140625, -5.168701171875, -5.00286865234375, -4.8370361328125, -4.67120361328125, -4.50537109375, -4.33953857421875, -4.1737060546875, -4.00787353515625, -3.842041015625, -3.67620849609375, -3.5103759765625, -3.34454345703125, -3.1787109375, -3.01287841796875, -2.8470458984375, -2.68121337890625, -2.515380859375, -2.34954833984375, -2.1837158203125, -2.01788330078125, -1.85205078125, -1.68621826171875, -1.5203857421875, -1.35455322265625, -1.188720703125, -1.02288818359375, -0.8570556640625, -0.69122314453125, -0.525390625, -0.35955810546875, -0.1937255859375, -0.02789306640625, 0.137939453125, 0.30377197265625, 0.4696044921875, 0.63543701171875, 0.80126953125, 0.96710205078125, 1.1329345703125, 1.29876708984375, 1.464599609375, 1.63043212890625, 1.7962646484375, 1.96209716796875, 2.1279296875, 2.29376220703125, 2.4595947265625, 2.62542724609375, 2.791259765625, 2.95709228515625, 3.1229248046875, 3.28875732421875, 3.45458984375, 3.62042236328125, 3.7862548828125, 3.95208740234375, 4.117919921875, 4.28375244140625, 4.4495849609375, 4.61541748046875, 4.78125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 13.0, 19.0, 20.0, 36.0, 64.0, 111.0, 152.0, 176.0, 148.0, 105.0, 58.0, 31.0, 25.0, 11.0, 9.0, 2.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008401870727539062, -0.0008170530200004578, -0.0007939189672470093, -0.0007707849144935608, -0.0007476508617401123, -0.0007245168089866638, -0.0007013827562332153, -0.0006782487034797668, -0.0006551146507263184, -0.0006319805979728699, -0.0006088465452194214, -0.0005857124924659729, -0.0005625784397125244, -0.0005394443869590759, -0.0005163103342056274, -0.000493176281452179, -0.00047004222869873047, -0.000446908175945282, -0.0004237741231918335, -0.000400640070438385, -0.0003775060176849365, -0.00035437196493148804, -0.00033123791217803955, -0.00030810385942459106, -0.0002849698066711426, -0.0002618357539176941, -0.0002387017011642456, -0.00021556764841079712, -0.00019243359565734863, -0.00016929954290390015, -0.00014616549015045166, -0.00012303143739700317, -9.989738464355469e-05, -7.67633318901062e-05, -5.3629279136657715e-05, -3.049522638320923e-05, -7.361173629760742e-06, 1.5772879123687744e-05, 3.890693187713623e-05, 6.204098463058472e-05, 8.51750373840332e-05, 0.00010830909013748169, 0.00013144314289093018, 0.00015457719564437866, 0.00017771124839782715, 0.00020084530115127563, 0.00022397935390472412, 0.0002471134066581726, 0.0002702474594116211, 0.0002933815121650696, 0.00031651556491851807, 0.00033964961767196655, 0.00036278367042541504, 0.0003859177231788635, 0.000409051775932312, 0.0004321858286857605, 0.000455319881439209, 0.00047845393419265747, 0.000501587986946106, 0.0005247220396995544, 0.0005478560924530029, 0.0005709901452064514, 0.0005941241979598999, 0.0006172582507133484, 0.0006403923034667969]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 4.0, 9.0, 13.0, 17.0, 25.0, 30.0, 62.0, 113.0, 165.0, 312.0, 643.0, 1326.0, 3264.0, 12311.0, 130207.0, 834030.0, 53634.0, 7820.0, 2461.0, 962.0, 475.0, 247.0, 151.0, 102.0, 55.0, 35.0, 20.0, 14.0, 12.0, 9.0, 6.0, 3.0, 2.0, 5.0, 0.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.150390625, -3.009429931640625, -2.86846923828125, -2.727508544921875, -2.5865478515625, -2.445587158203125, -2.30462646484375, -2.163665771484375, -2.022705078125, -1.881744384765625, -1.74078369140625, -1.599822998046875, -1.4588623046875, -1.317901611328125, -1.17694091796875, -1.035980224609375, -0.89501953125, -0.754058837890625, -0.61309814453125, -0.472137451171875, -0.3311767578125, -0.190216064453125, -0.04925537109375, 0.091705322265625, 0.232666015625, 0.373626708984375, 0.51458740234375, 0.655548095703125, 0.7965087890625, 0.937469482421875, 1.07843017578125, 1.219390869140625, 1.3603515625, 1.501312255859375, 1.64227294921875, 1.783233642578125, 1.9241943359375, 2.065155029296875, 2.20611572265625, 2.347076416015625, 2.488037109375, 2.628997802734375, 2.76995849609375, 2.910919189453125, 3.0518798828125, 3.192840576171875, 3.33380126953125, 3.474761962890625, 3.61572265625, 3.756683349609375, 3.89764404296875, 4.038604736328125, 4.1795654296875, 4.320526123046875, 4.46148681640625, 4.602447509765625, 4.743408203125, 4.884368896484375, 5.02532958984375, 5.166290283203125, 5.3072509765625, 5.448211669921875, 5.58917236328125, 5.730133056640625, 5.87109375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 1.0, 1.0, 8.0, 10.0, 7.0, 18.0, 37.0, 84.0, 146.0, 229.0, 207.0, 102.0, 62.0, 33.0, 11.0, 13.0, 4.0, 2.0, 6.0, 5.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.09375, -4.8697509765625, -4.645751953125, -4.4217529296875, -4.19775390625, -3.9737548828125, -3.749755859375, -3.5257568359375, -3.3017578125, -3.0777587890625, -2.853759765625, -2.6297607421875, -2.40576171875, -2.1817626953125, -1.957763671875, -1.7337646484375, -1.509765625, -1.2857666015625, -1.061767578125, -0.8377685546875, -0.61376953125, -0.3897705078125, -0.165771484375, 0.0582275390625, 0.2822265625, 0.5062255859375, 0.730224609375, 0.9542236328125, 1.17822265625, 1.4022216796875, 1.626220703125, 1.8502197265625, 2.07421875, 2.2982177734375, 2.522216796875, 2.7462158203125, 2.97021484375, 3.1942138671875, 3.418212890625, 3.6422119140625, 3.8662109375, 4.0902099609375, 4.314208984375, 4.5382080078125, 4.76220703125, 4.9862060546875, 5.210205078125, 5.4342041015625, 5.658203125, 5.8822021484375, 6.106201171875, 6.3302001953125, 6.55419921875, 6.7781982421875, 7.002197265625, 7.2261962890625, 7.4501953125, 7.6741943359375, 7.898193359375, 8.1221923828125, 8.34619140625, 8.5701904296875, 8.794189453125, 9.0181884765625, 9.2421875]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 0.0, 2.0, 7.0, 2.0, 5.0, 14.0, 13.0, 13.0, 37.0, 59.0, 102.0, 149.0, 146.0, 129.0, 97.0, 71.0, 58.0, 33.0, 23.0, 10.0, 9.0, 11.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.8477897644043, -44.08858871459961, -42.32938766479492, -40.5701904296875, -38.81098937988281, -37.051788330078125, -35.29258728027344, -33.53338623046875, -31.774187088012695, -30.014986038208008, -28.255786895751953, -26.496585845947266, -24.737384796142578, -22.978185653686523, -21.218984603881836, -19.45978546142578, -17.700584411621094, -15.941384315490723, -14.182184219360352, -12.422983169555664, -10.663783073425293, -8.904582977294922, -7.145381927490234, -5.386181831359863, -3.626981735229492, -1.867781400680542, -0.1085810661315918, 1.6506195068359375, 3.4098196029663086, 5.16901969909668, 6.928220748901367, 8.687420845031738, 10.446624755859375, 12.205824851989746, 13.965024948120117, 15.724225997924805, 17.48342514038086, 19.242626190185547, 21.001827239990234, 22.761028289794922, 24.520227432250977, 26.279428482055664, 28.03862762451172, 29.797828674316406, 31.557029724121094, 33.31623077392578, 35.07543182373047, 36.83462905883789, 38.59383010864258, 40.353031158447266, 42.11223220825195, 43.871429443359375, 45.63063049316406, 47.38983154296875, 49.14903259277344, 50.908233642578125, 52.66743469238281, 54.4266357421875, 56.18583679199219, 57.945037841796875, 59.7042350769043, 61.463436126708984, 63.22263717651367, 64.9818344116211, 66.74103546142578]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 5.0, 3.0, 9.0, 11.0, 19.0, 17.0, 20.0, 22.0, 28.0, 39.0, 47.0, 51.0, 54.0, 62.0, 70.0, 69.0, 79.0, 53.0, 51.0, 46.0, 45.0, 32.0, 30.0, 25.0, 25.0, 16.0, 12.0, 19.0, 6.0, 10.0, 3.0, 6.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-77.399658203125, -75.28307342529297, -73.1664810180664, -71.04989624023438, -68.93330383300781, -66.81671905517578, -64.70012664794922, -62.58354187011719, -60.466949462890625, -58.35036087036133, -56.23377227783203, -54.117183685302734, -52.00059509277344, -49.88400650024414, -47.767417907714844, -45.65083312988281, -43.534244537353516, -41.41765594482422, -39.30106735229492, -37.184478759765625, -35.06789016723633, -32.95130157470703, -30.834714889526367, -28.71812629699707, -26.601537704467773, -24.484949111938477, -22.36836051940918, -20.251773834228516, -18.13518524169922, -16.018596649169922, -13.902008056640625, -11.785419464111328, -9.668827056884766, -7.552238464355469, -5.43565034866333, -3.3190622329711914, -1.2024736404418945, 0.9141149520874023, 3.030702590942383, 5.14729118347168, 7.263879776000977, 9.380468368530273, 11.49705696105957, 13.61364459991455, 15.730233192443848, 17.846820831298828, 19.963409423828125, 22.079998016357422, 24.19658660888672, 26.313175201416016, 28.429763793945312, 30.54635238647461, 32.662940979003906, 34.7795295715332, 36.8961181640625, 39.01270294189453, 41.129295349121094, 43.24588394165039, 45.36247253417969, 47.479061126708984, 49.59564971923828, 51.71223831176758, 53.828826904296875, 55.945411682128906, 58.0620002746582]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 2.0, 5.0, 9.0, 14.0, 17.0, 19.0, 46.0, 60.0, 75.0, 153.0, 295.0, 651.0, 1774.0, 7827.0, 4152742.0, 25629.0, 3031.0, 965.0, 417.0, 213.0, 116.0, 74.0, 43.0, 22.0, 21.0, 7.0, 15.0, 11.0, 4.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-24.90625, -24.3092041015625, -23.712158203125, -23.1151123046875, -22.51806640625, -21.9210205078125, -21.323974609375, -20.7269287109375, -20.1298828125, -19.5328369140625, -18.935791015625, -18.3387451171875, -17.74169921875, -17.1446533203125, -16.547607421875, -15.9505615234375, -15.353515625, -14.7564697265625, -14.159423828125, -13.5623779296875, -12.96533203125, -12.3682861328125, -11.771240234375, -11.1741943359375, -10.5771484375, -9.9801025390625, -9.383056640625, -8.7860107421875, -8.18896484375, -7.5919189453125, -6.994873046875, -6.3978271484375, -5.80078125, -5.2037353515625, -4.606689453125, -4.0096435546875, -3.41259765625, -2.8155517578125, -2.218505859375, -1.6214599609375, -1.0244140625, -0.4273681640625, 0.169677734375, 0.7667236328125, 1.36376953125, 1.9608154296875, 2.557861328125, 3.1549072265625, 3.751953125, 4.3489990234375, 4.946044921875, 5.5430908203125, 6.14013671875, 6.7371826171875, 7.334228515625, 7.9312744140625, 8.5283203125, 9.1253662109375, 9.722412109375, 10.3194580078125, 10.91650390625, 11.5135498046875, 12.110595703125, 12.7076416015625, 13.3046875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 6.0, 15.0, 28.0, 44.0, 96.0, 139.0, 198.0, 166.0, 140.0, 68.0, 48.0, 35.0, 14.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.53125, -11.25616455078125, -10.9810791015625, -10.70599365234375, -10.430908203125, -10.15582275390625, -9.8807373046875, -9.60565185546875, -9.33056640625, -9.05548095703125, -8.7803955078125, -8.50531005859375, -8.230224609375, -7.95513916015625, -7.6800537109375, -7.40496826171875, -7.1298828125, -6.85479736328125, -6.5797119140625, -6.30462646484375, -6.029541015625, -5.75445556640625, -5.4793701171875, -5.20428466796875, -4.92919921875, -4.65411376953125, -4.3790283203125, -4.10394287109375, -3.828857421875, -3.55377197265625, -3.2786865234375, -3.00360107421875, -2.728515625, -2.45343017578125, -2.1783447265625, -1.90325927734375, -1.628173828125, -1.35308837890625, -1.0780029296875, -0.80291748046875, -0.52783203125, -0.25274658203125, 0.0223388671875, 0.29742431640625, 0.572509765625, 0.84759521484375, 1.1226806640625, 1.39776611328125, 1.6728515625, 1.94793701171875, 2.2230224609375, 2.49810791015625, 2.773193359375, 3.04827880859375, 3.3233642578125, 3.59844970703125, 3.87353515625, 4.14862060546875, 4.4237060546875, 4.69879150390625, 4.973876953125, 5.24896240234375, 5.5240478515625, 5.79913330078125, 6.07421875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 1.0, 4.0, 7.0, 7.0, 10.0, 18.0, 27.0, 29.0, 41.0, 35.0, 57.0, 77.0, 141.0, 190.0, 278.0, 467.0, 852.0, 1826.0, 5986.0, 98716.0, 4072635.0, 8145.0, 2247.0, 996.0, 454.0, 313.0, 222.0, 150.0, 101.0, 61.0, 55.0, 37.0, 29.0, 17.0, 13.0, 12.0, 11.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.21875, -23.487060546875, -22.75537109375, -22.023681640625, -21.2919921875, -20.560302734375, -19.82861328125, -19.096923828125, -18.365234375, -17.633544921875, -16.90185546875, -16.170166015625, -15.4384765625, -14.706787109375, -13.97509765625, -13.243408203125, -12.51171875, -11.780029296875, -11.04833984375, -10.316650390625, -9.5849609375, -8.853271484375, -8.12158203125, -7.389892578125, -6.658203125, -5.926513671875, -5.19482421875, -4.463134765625, -3.7314453125, -2.999755859375, -2.26806640625, -1.536376953125, -0.8046875, -0.072998046875, 0.65869140625, 1.390380859375, 2.1220703125, 2.853759765625, 3.58544921875, 4.317138671875, 5.048828125, 5.780517578125, 6.51220703125, 7.243896484375, 7.9755859375, 8.707275390625, 9.43896484375, 10.170654296875, 10.90234375, 11.634033203125, 12.36572265625, 13.097412109375, 13.8291015625, 14.560791015625, 15.29248046875, 16.024169921875, 16.755859375, 17.487548828125, 18.21923828125, 18.950927734375, 19.6826171875, 20.414306640625, 21.14599609375, 21.877685546875, 22.609375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 8.0, 10.0, 24.0, 516.0, 3470.0, 24.0, 11.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.734375, -18.31842041015625, -17.9024658203125, -17.48651123046875, -17.070556640625, -16.65460205078125, -16.2386474609375, -15.82269287109375, -15.40673828125, -14.99078369140625, -14.5748291015625, -14.15887451171875, -13.742919921875, -13.32696533203125, -12.9110107421875, -12.49505615234375, -12.0791015625, -11.66314697265625, -11.2471923828125, -10.83123779296875, -10.415283203125, -9.99932861328125, -9.5833740234375, -9.16741943359375, -8.75146484375, -8.33551025390625, -7.9195556640625, -7.50360107421875, -7.087646484375, -6.67169189453125, -6.2557373046875, -5.83978271484375, -5.423828125, -5.00787353515625, -4.5919189453125, -4.17596435546875, -3.760009765625, -3.34405517578125, -2.9281005859375, -2.51214599609375, -2.09619140625, -1.68023681640625, -1.2642822265625, -0.84832763671875, -0.432373046875, -0.01641845703125, 0.3995361328125, 0.81549072265625, 1.2314453125, 1.64739990234375, 2.0633544921875, 2.47930908203125, 2.895263671875, 3.31121826171875, 3.7271728515625, 4.14312744140625, 4.55908203125, 4.97503662109375, 5.3909912109375, 5.80694580078125, 6.222900390625, 6.63885498046875, 7.0548095703125, 7.47076416015625, 7.88671875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 9.0, 4.0, 12.0, 4.0, 14.0, 23.0, 42.0, 42.0, 81.0, 99.0, 124.0, 149.0, 134.0, 79.0, 65.0, 43.0, 31.0, 18.0, 5.0, 8.0, 7.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.195390701293945, -17.581708908081055, -16.968027114868164, -16.354345321655273, -15.740663528442383, -15.126981735229492, -14.513300895690918, -13.899619102478027, -13.285937309265137, -12.672255516052246, -12.058573722839355, -11.444891929626465, -10.83121109008789, -10.217529296875, -9.60384750366211, -8.990165710449219, -8.376483917236328, -7.7628021240234375, -7.149120330810547, -6.5354390144348145, -5.921757221221924, -5.308075428009033, -4.694394111633301, -4.08071231842041, -3.4670305252075195, -2.853348731994629, -2.2396671772003174, -1.6259855031967163, -1.0123038291931152, -0.3986220359802246, 0.21505951881408691, 0.8287410736083984, 1.4424247741699219, 2.0561065673828125, 2.669788122177124, 3.2834696769714355, 3.897151470184326, 4.510833263397217, 5.124514579772949, 5.73819637298584, 6.3518781661987305, 6.965559959411621, 7.579241752624512, 8.192923545837402, 8.806604385375977, 9.420286178588867, 10.033967971801758, 10.647649765014648, 11.261331558227539, 11.87501335144043, 12.48869514465332, 13.102376937866211, 13.716058731079102, 14.329740524291992, 14.943421363830566, 15.557103157043457, 16.17078399658203, 16.784465789794922, 17.398147583007812, 18.011829376220703, 18.625511169433594, 19.239192962646484, 19.852874755859375, 20.466556549072266, 21.080238342285156]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 6.0, 8.0, 3.0, 5.0, 7.0, 11.0, 14.0, 15.0, 15.0, 19.0, 17.0, 23.0, 31.0, 30.0, 38.0, 42.0, 32.0, 47.0, 47.0, 37.0, 46.0, 54.0, 56.0, 59.0, 41.0, 48.0, 37.0, 42.0, 37.0, 24.0, 22.0, 19.0, 11.0, 10.0, 12.0, 5.0, 9.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.887566566467285, -13.414897918701172, -12.942229270935059, -12.469560623168945, -11.996891975402832, -11.524223327636719, -11.051555633544922, -10.578886032104492, -10.106218338012695, -9.633549690246582, -9.160881042480469, -8.688212394714355, -8.215543746948242, -7.742875099182129, -7.270206928253174, -6.7975382804870605, -6.324869155883789, -5.852200508117676, -5.3795318603515625, -4.906863212585449, -4.434194564819336, -3.9615261554718018, -3.4888577461242676, -3.0161890983581543, -2.543520450592041, -2.0708518028259277, -1.598183274269104, -1.1255147457122803, -0.652846097946167, -0.1801774501800537, 0.29249095916748047, 0.7651596069335938, 1.2378292083740234, 1.7104978561401367, 2.18316650390625, 2.655834913253784, 3.1285035610198975, 3.6011722087860107, 4.073840618133545, 4.546509265899658, 5.0191779136657715, 5.491846561431885, 5.964515209197998, 6.437183380126953, 6.909852027893066, 7.38252067565918, 7.855189323425293, 8.327857971191406, 8.80052661895752, 9.273195266723633, 9.745863914489746, 10.21853256225586, 10.691201210021973, 11.163869857788086, 11.636537551879883, 12.109207153320312, 12.58187484741211, 13.054543495178223, 13.527212142944336, 13.99988079071045, 14.472549438476562, 14.945218086242676, 15.417886734008789, 15.890554428100586, 16.363224029541016]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 1.0, 3.0, 6.0, 5.0, 14.0, 16.0, 22.0, 50.0, 73.0, 139.0, 280.0, 663.0, 2087.0, 11350.0, 169450.0, 800529.0, 55980.0, 5571.0, 1334.0, 495.0, 216.0, 113.0, 58.0, 43.0, 16.0, 19.0, 9.0, 4.0, 2.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.7265625, -14.2408447265625, -13.755126953125, -13.2694091796875, -12.78369140625, -12.2979736328125, -11.812255859375, -11.3265380859375, -10.8408203125, -10.3551025390625, -9.869384765625, -9.3836669921875, -8.89794921875, -8.4122314453125, -7.926513671875, -7.4407958984375, -6.955078125, -6.4693603515625, -5.983642578125, -5.4979248046875, -5.01220703125, -4.5264892578125, -4.040771484375, -3.5550537109375, -3.0693359375, -2.5836181640625, -2.097900390625, -1.6121826171875, -1.12646484375, -0.6407470703125, -0.155029296875, 0.3306884765625, 0.81640625, 1.3021240234375, 1.787841796875, 2.2735595703125, 2.75927734375, 3.2449951171875, 3.730712890625, 4.2164306640625, 4.7021484375, 5.1878662109375, 5.673583984375, 6.1593017578125, 6.64501953125, 7.1307373046875, 7.616455078125, 8.1021728515625, 8.587890625, 9.0736083984375, 9.559326171875, 10.0450439453125, 10.53076171875, 11.0164794921875, 11.502197265625, 11.9879150390625, 12.4736328125, 12.9593505859375, 13.445068359375, 13.9307861328125, 14.41650390625, 14.9022216796875, 15.387939453125, 15.8736572265625, 16.359375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 7.0, 6.0, 20.0, 26.0, 52.0, 40.0, 60.0, 88.0, 106.0, 140.0, 105.0, 103.0, 65.0, 60.0, 53.0, 28.0, 20.0, 8.0, 4.0, 7.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.1796875, -7.97369384765625, -7.7677001953125, -7.56170654296875, -7.355712890625, -7.14971923828125, -6.9437255859375, -6.73773193359375, -6.53173828125, -6.32574462890625, -6.1197509765625, -5.91375732421875, -5.707763671875, -5.50177001953125, -5.2957763671875, -5.08978271484375, -4.8837890625, -4.67779541015625, -4.4718017578125, -4.26580810546875, -4.059814453125, -3.85382080078125, -3.6478271484375, -3.44183349609375, -3.23583984375, -3.02984619140625, -2.8238525390625, -2.61785888671875, -2.411865234375, -2.20587158203125, -1.9998779296875, -1.79388427734375, -1.587890625, -1.38189697265625, -1.1759033203125, -0.96990966796875, -0.763916015625, -0.55792236328125, -0.3519287109375, -0.14593505859375, 0.06005859375, 0.26605224609375, 0.4720458984375, 0.67803955078125, 0.884033203125, 1.09002685546875, 1.2960205078125, 1.50201416015625, 1.7080078125, 1.91400146484375, 2.1199951171875, 2.32598876953125, 2.531982421875, 2.73797607421875, 2.9439697265625, 3.14996337890625, 3.35595703125, 3.56195068359375, 3.7679443359375, 3.97393798828125, 4.179931640625, 4.38592529296875, 4.5919189453125, 4.79791259765625, 5.00390625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 0.0, 4.0, 3.0, 1.0, 8.0, 8.0, 12.0, 15.0, 23.0, 28.0, 42.0, 57.0, 82.0, 151.0, 289.0, 513.0, 1118.0, 2695.0, 8061.0, 40158.0, 535798.0, 413654.0, 33860.0, 7312.0, 2466.0, 1018.0, 506.0, 257.0, 151.0, 75.0, 59.0, 34.0, 25.0, 25.0, 12.0, 8.0, 5.0, 4.0, 4.0, 5.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-13.6875, -13.284423828125, -12.88134765625, -12.478271484375, -12.0751953125, -11.672119140625, -11.26904296875, -10.865966796875, -10.462890625, -10.059814453125, -9.65673828125, -9.253662109375, -8.8505859375, -8.447509765625, -8.04443359375, -7.641357421875, -7.23828125, -6.835205078125, -6.43212890625, -6.029052734375, -5.6259765625, -5.222900390625, -4.81982421875, -4.416748046875, -4.013671875, -3.610595703125, -3.20751953125, -2.804443359375, -2.4013671875, -1.998291015625, -1.59521484375, -1.192138671875, -0.7890625, -0.385986328125, 0.01708984375, 0.420166015625, 0.8232421875, 1.226318359375, 1.62939453125, 2.032470703125, 2.435546875, 2.838623046875, 3.24169921875, 3.644775390625, 4.0478515625, 4.450927734375, 4.85400390625, 5.257080078125, 5.66015625, 6.063232421875, 6.46630859375, 6.869384765625, 7.2724609375, 7.675537109375, 8.07861328125, 8.481689453125, 8.884765625, 9.287841796875, 9.69091796875, 10.093994140625, 10.4970703125, 10.900146484375, 11.30322265625, 11.706298828125, 12.109375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 0.0, 3.0, 3.0, 5.0, 5.0, 5.0, 1.0, 11.0, 17.0, 13.0, 25.0, 38.0, 44.0, 48.0, 47.0, 64.0, 69.0, 77.0, 68.0, 86.0, 57.0, 56.0, 59.0, 32.0, 50.0, 27.0, 20.0, 19.0, 17.0, 9.0, 6.0, 7.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.21875, -23.5556640625, -22.892578125, -22.2294921875, -21.56640625, -20.9033203125, -20.240234375, -19.5771484375, -18.9140625, -18.2509765625, -17.587890625, -16.9248046875, -16.26171875, -15.5986328125, -14.935546875, -14.2724609375, -13.609375, -12.9462890625, -12.283203125, -11.6201171875, -10.95703125, -10.2939453125, -9.630859375, -8.9677734375, -8.3046875, -7.6416015625, -6.978515625, -6.3154296875, -5.65234375, -4.9892578125, -4.326171875, -3.6630859375, -3.0, -2.3369140625, -1.673828125, -1.0107421875, -0.34765625, 0.3154296875, 0.978515625, 1.6416015625, 2.3046875, 2.9677734375, 3.630859375, 4.2939453125, 4.95703125, 5.6201171875, 6.283203125, 6.9462890625, 7.609375, 8.2724609375, 8.935546875, 9.5986328125, 10.26171875, 10.9248046875, 11.587890625, 12.2509765625, 12.9140625, 13.5771484375, 14.240234375, 14.9033203125, 15.56640625, 16.2294921875, 16.892578125, 17.5556640625, 18.21875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 5.0, 16.0, 13.0, 35.0, 38.0, 90.0, 152.0, 349.0, 779.0, 2601.0, 19950.0, 906366.0, 110236.0, 5689.0, 1275.0, 486.0, 204.0, 118.0, 48.0, 39.0, 17.0, 13.0, 13.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6171875, -6.3785400390625, -6.139892578125, -5.9012451171875, -5.66259765625, -5.4239501953125, -5.185302734375, -4.9466552734375, -4.7080078125, -4.4693603515625, -4.230712890625, -3.9920654296875, -3.75341796875, -3.5147705078125, -3.276123046875, -3.0374755859375, -2.798828125, -2.5601806640625, -2.321533203125, -2.0828857421875, -1.84423828125, -1.6055908203125, -1.366943359375, -1.1282958984375, -0.8896484375, -0.6510009765625, -0.412353515625, -0.1737060546875, 0.06494140625, 0.3035888671875, 0.542236328125, 0.7808837890625, 1.01953125, 1.2581787109375, 1.496826171875, 1.7354736328125, 1.97412109375, 2.2127685546875, 2.451416015625, 2.6900634765625, 2.9287109375, 3.1673583984375, 3.406005859375, 3.6446533203125, 3.88330078125, 4.1219482421875, 4.360595703125, 4.5992431640625, 4.837890625, 5.0765380859375, 5.315185546875, 5.5538330078125, 5.79248046875, 6.0311279296875, 6.269775390625, 6.5084228515625, 6.7470703125, 6.9857177734375, 7.224365234375, 7.4630126953125, 7.70166015625, 7.9403076171875, 8.178955078125, 8.4176025390625, 8.65625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 11.0, 9.0, 16.0, 25.0, 37.0, 69.0, 125.0, 190.0, 178.0, 106.0, 95.0, 52.0, 29.0, 18.0, 13.0, 6.0, 9.0, 7.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005855560302734375, -0.0005550086498260498, -0.0005244612693786621, -0.0004939138889312744, -0.0004633665084838867, -0.000432819128036499, -0.00040227174758911133, -0.00037172436714172363, -0.00034117698669433594, -0.00031062960624694824, -0.00028008222579956055, -0.00024953484535217285, -0.00021898746490478516, -0.00018844008445739746, -0.00015789270401000977, -0.00012734532356262207, -9.679794311523438e-05, -6.625056266784668e-05, -3.5703182220458984e-05, -5.155801773071289e-06, 2.5391578674316406e-05, 5.59389591217041e-05, 8.64863395690918e-05, 0.00011703372001647949, 0.0001475811004638672, 0.00017812848091125488, 0.00020867586135864258, 0.00023922324180603027, 0.00026977062225341797, 0.00030031800270080566, 0.00033086538314819336, 0.00036141276359558105, 0.00039196014404296875, 0.00042250752449035645, 0.00045305490493774414, 0.00048360228538513184, 0.0005141496658325195, 0.0005446970462799072, 0.0005752444267272949, 0.0006057918071746826, 0.0006363391876220703, 0.000666886568069458, 0.0006974339485168457, 0.0007279813289642334, 0.0007585287094116211, 0.0007890760898590088, 0.0008196234703063965, 0.0008501708507537842, 0.0008807182312011719, 0.0009112656116485596, 0.0009418129920959473, 0.000972360372543335, 0.0010029077529907227, 0.0010334551334381104, 0.001064002513885498, 0.0010945498943328857, 0.0011250972747802734, 0.0011556446552276611, 0.0011861920356750488, 0.0012167394161224365, 0.0012472867965698242, 0.001277834177017212, 0.0013083815574645996, 0.0013389289379119873, 0.001369476318359375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 13.0, 10.0, 27.0, 30.0, 55.0, 114.0, 219.0, 485.0, 1660.0, 8344.0, 164195.0, 839057.0, 29096.0, 3542.0, 939.0, 363.0, 158.0, 89.0, 66.0, 33.0, 15.0, 22.0, 10.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.32421875, -6.134033203125, -5.94384765625, -5.753662109375, -5.5634765625, -5.373291015625, -5.18310546875, -4.992919921875, -4.802734375, -4.612548828125, -4.42236328125, -4.232177734375, -4.0419921875, -3.851806640625, -3.66162109375, -3.471435546875, -3.28125, -3.091064453125, -2.90087890625, -2.710693359375, -2.5205078125, -2.330322265625, -2.14013671875, -1.949951171875, -1.759765625, -1.569580078125, -1.37939453125, -1.189208984375, -0.9990234375, -0.808837890625, -0.61865234375, -0.428466796875, -0.23828125, -0.048095703125, 0.14208984375, 0.332275390625, 0.5224609375, 0.712646484375, 0.90283203125, 1.093017578125, 1.283203125, 1.473388671875, 1.66357421875, 1.853759765625, 2.0439453125, 2.234130859375, 2.42431640625, 2.614501953125, 2.8046875, 2.994873046875, 3.18505859375, 3.375244140625, 3.5654296875, 3.755615234375, 3.94580078125, 4.135986328125, 4.326171875, 4.516357421875, 4.70654296875, 4.896728515625, 5.0869140625, 5.277099609375, 5.46728515625, 5.657470703125, 5.84765625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 20.0, 22.0, 28.0, 58.0, 114.0, 174.0, 179.0, 147.0, 98.0, 65.0, 30.0, 22.0, 9.0, 10.0, 6.0, 1.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7421875, -8.50115966796875, -8.2601318359375, -8.01910400390625, -7.778076171875, -7.53704833984375, -7.2960205078125, -7.05499267578125, -6.81396484375, -6.57293701171875, -6.3319091796875, -6.09088134765625, -5.849853515625, -5.60882568359375, -5.3677978515625, -5.12677001953125, -4.8857421875, -4.64471435546875, -4.4036865234375, -4.16265869140625, -3.921630859375, -3.68060302734375, -3.4395751953125, -3.19854736328125, -2.95751953125, -2.71649169921875, -2.4754638671875, -2.23443603515625, -1.993408203125, -1.75238037109375, -1.5113525390625, -1.27032470703125, -1.029296875, -0.78826904296875, -0.5472412109375, -0.30621337890625, -0.065185546875, 0.17584228515625, 0.4168701171875, 0.65789794921875, 0.89892578125, 1.13995361328125, 1.3809814453125, 1.62200927734375, 1.863037109375, 2.10406494140625, 2.3450927734375, 2.58612060546875, 2.8271484375, 3.06817626953125, 3.3092041015625, 3.55023193359375, 3.791259765625, 4.03228759765625, 4.2733154296875, 4.51434326171875, 4.75537109375, 4.99639892578125, 5.2374267578125, 5.47845458984375, 5.719482421875, 5.96051025390625, 6.2015380859375, 6.44256591796875, 6.68359375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 10.0, 26.0, 89.0, 235.0, 387.0, 183.0, 49.0, 22.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-187.52291870117188, -181.35804748535156, -175.19317626953125, -169.02830505371094, -162.86343383789062, -156.69857788085938, -150.53370666503906, -144.36883544921875, -138.20396423339844, -132.03909301757812, -125.87422180175781, -119.70935821533203, -113.54448699951172, -107.3796157836914, -101.21475219726562, -95.04988098144531, -88.885009765625, -82.72013854980469, -76.55526733398438, -70.3904037475586, -64.22553253173828, -58.06066131591797, -51.89579391479492, -45.730926513671875, -39.56605529785156, -33.40118408203125, -27.236316680908203, -21.071447372436523, -14.906578063964844, -8.741708755493164, -2.5768394470214844, 3.5880279541015625, 9.752883911132812, 15.917753219604492, 22.082622528076172, 28.24749183654785, 34.41236114501953, 40.577232360839844, 46.74209976196289, 52.90696716308594, 59.07183837890625, 65.23670959472656, 71.40158081054688, 77.56644439697266, 83.73131561279297, 89.89618682861328, 96.06105041503906, 102.22592163085938, 108.39079284667969, 114.5556640625, 120.72053527832031, 126.8853988647461, 133.05026245117188, 139.2151336669922, 145.3800048828125, 151.5448760986328, 157.70974731445312, 163.87461853027344, 170.03948974609375, 176.20436096191406, 182.36923217773438, 188.53408813476562, 194.69895935058594, 200.86383056640625, 207.02870178222656]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 2.0, 4.0, 6.0, 7.0, 10.0, 13.0, 26.0, 23.0, 34.0, 31.0, 36.0, 48.0, 48.0, 51.0, 62.0, 70.0, 58.0, 68.0, 73.0, 62.0, 45.0, 44.0, 39.0, 29.0, 20.0, 20.0, 16.0, 8.0, 14.0, 7.0, 7.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.3236083984375, -84.543212890625, -81.76280975341797, -78.98241424560547, -76.20201110839844, -73.42161560058594, -70.64122009277344, -67.8608169555664, -65.0804214477539, -62.30002212524414, -59.519622802734375, -56.739227294921875, -53.95882797241211, -51.178428649902344, -48.39802932739258, -45.61763000488281, -42.83723068237305, -40.05683135986328, -37.276432037353516, -34.49603271484375, -31.71563720703125, -28.935237884521484, -26.15483856201172, -23.374441146850586, -20.59404182434082, -17.813642501831055, -15.033245086669922, -12.252845764160156, -9.472447395324707, -6.692049026489258, -3.911649703979492, -1.1312522888183594, 1.6491470336914062, 4.4295454025268555, 7.209944248199463, 9.99034309387207, 12.77074146270752, 15.551139831542969, 18.331539154052734, 21.111936569213867, 23.892335891723633, 26.6727352142334, 29.45313262939453, 32.2335319519043, 35.01393127441406, 37.79432678222656, 40.574729919433594, 43.355125427246094, 46.13552474975586, 48.915924072265625, 51.69632339477539, 54.476722717285156, 57.257118225097656, 60.03751754760742, 62.81791687011719, 65.59831237792969, 68.37871551513672, 71.15911102294922, 73.93951416015625, 76.71990966796875, 79.50031280517578, 82.28070831298828, 85.06111145019531, 87.84150695800781, 90.62190246582031]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 6.0, 8.0, 10.0, 9.0, 21.0, 37.0, 58.0, 96.0, 135.0, 265.0, 496.0, 1099.0, 2725.0, 8580.0, 36180.0, 644746.0, 3415267.0, 64495.0, 12953.0, 3931.0, 1536.0, 724.0, 362.0, 222.0, 106.0, 60.0, 39.0, 39.0, 24.0, 13.0, 13.0, 11.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.0234375, -7.7659912109375, -7.508544921875, -7.2510986328125, -6.99365234375, -6.7362060546875, -6.478759765625, -6.2213134765625, -5.9638671875, -5.7064208984375, -5.448974609375, -5.1915283203125, -4.93408203125, -4.6766357421875, -4.419189453125, -4.1617431640625, -3.904296875, -3.6468505859375, -3.389404296875, -3.1319580078125, -2.87451171875, -2.6170654296875, -2.359619140625, -2.1021728515625, -1.8447265625, -1.5872802734375, -1.329833984375, -1.0723876953125, -0.81494140625, -0.5574951171875, -0.300048828125, -0.0426025390625, 0.21484375, 0.4722900390625, 0.729736328125, 0.9871826171875, 1.24462890625, 1.5020751953125, 1.759521484375, 2.0169677734375, 2.2744140625, 2.5318603515625, 2.789306640625, 3.0467529296875, 3.30419921875, 3.5616455078125, 3.819091796875, 4.0765380859375, 4.333984375, 4.5914306640625, 4.848876953125, 5.1063232421875, 5.36376953125, 5.6212158203125, 5.878662109375, 6.1361083984375, 6.3935546875, 6.6510009765625, 6.908447265625, 7.1658935546875, 7.42333984375, 7.6807861328125, 7.938232421875, 8.1956787109375, 8.453125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 4.0, 10.0, 9.0, 14.0, 31.0, 31.0, 53.0, 56.0, 70.0, 91.0, 89.0, 109.0, 94.0, 91.0, 69.0, 49.0, 34.0, 31.0, 19.0, 18.0, 9.0, 4.0, 8.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.20703125, -4.0345458984375, -3.862060546875, -3.6895751953125, -3.51708984375, -3.3446044921875, -3.172119140625, -2.9996337890625, -2.8271484375, -2.6546630859375, -2.482177734375, -2.3096923828125, -2.13720703125, -1.9647216796875, -1.792236328125, -1.6197509765625, -1.447265625, -1.2747802734375, -1.102294921875, -0.9298095703125, -0.75732421875, -0.5848388671875, -0.412353515625, -0.2398681640625, -0.0673828125, 0.1051025390625, 0.277587890625, 0.4500732421875, 0.62255859375, 0.7950439453125, 0.967529296875, 1.1400146484375, 1.3125, 1.4849853515625, 1.657470703125, 1.8299560546875, 2.00244140625, 2.1749267578125, 2.347412109375, 2.5198974609375, 2.6923828125, 2.8648681640625, 3.037353515625, 3.2098388671875, 3.38232421875, 3.5548095703125, 3.727294921875, 3.8997802734375, 4.072265625, 4.2447509765625, 4.417236328125, 4.5897216796875, 4.76220703125, 4.9346923828125, 5.107177734375, 5.2796630859375, 5.4521484375, 5.6246337890625, 5.797119140625, 5.9696044921875, 6.14208984375, 6.3145751953125, 6.487060546875, 6.6595458984375, 6.83203125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 7.0, 13.0, 23.0, 22.0, 48.0, 88.0, 160.0, 327.0, 680.0, 1578.0, 4642.0, 17756.0, 130774.0, 3874290.0, 137297.0, 18648.0, 4753.0, 1738.0, 736.0, 314.0, 158.0, 91.0, 55.0, 31.0, 18.0, 9.0, 9.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5546875, -10.2197265625, -9.884765625, -9.5498046875, -9.21484375, -8.8798828125, -8.544921875, -8.2099609375, -7.875, -7.5400390625, -7.205078125, -6.8701171875, -6.53515625, -6.2001953125, -5.865234375, -5.5302734375, -5.1953125, -4.8603515625, -4.525390625, -4.1904296875, -3.85546875, -3.5205078125, -3.185546875, -2.8505859375, -2.515625, -2.1806640625, -1.845703125, -1.5107421875, -1.17578125, -0.8408203125, -0.505859375, -0.1708984375, 0.1640625, 0.4990234375, 0.833984375, 1.1689453125, 1.50390625, 1.8388671875, 2.173828125, 2.5087890625, 2.84375, 3.1787109375, 3.513671875, 3.8486328125, 4.18359375, 4.5185546875, 4.853515625, 5.1884765625, 5.5234375, 5.8583984375, 6.193359375, 6.5283203125, 6.86328125, 7.1982421875, 7.533203125, 7.8681640625, 8.203125, 8.5380859375, 8.873046875, 9.2080078125, 9.54296875, 9.8779296875, 10.212890625, 10.5478515625, 10.8828125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 11.0, 11.0, 18.0, 22.0, 34.0, 54.0, 83.0, 212.0, 715.0, 1801.0, 682.0, 177.0, 82.0, 48.0, 32.0, 18.0, 13.0, 17.0, 11.0, 8.0, 5.0, 0.0, 4.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.0, -9.6492919921875, -9.298583984375, -8.9478759765625, -8.59716796875, -8.2464599609375, -7.895751953125, -7.5450439453125, -7.1943359375, -6.8436279296875, -6.492919921875, -6.1422119140625, -5.79150390625, -5.4407958984375, -5.090087890625, -4.7393798828125, -4.388671875, -4.0379638671875, -3.687255859375, -3.3365478515625, -2.98583984375, -2.6351318359375, -2.284423828125, -1.9337158203125, -1.5830078125, -1.2322998046875, -0.881591796875, -0.5308837890625, -0.18017578125, 0.1705322265625, 0.521240234375, 0.8719482421875, 1.22265625, 1.5733642578125, 1.924072265625, 2.2747802734375, 2.62548828125, 2.9761962890625, 3.326904296875, 3.6776123046875, 4.0283203125, 4.3790283203125, 4.729736328125, 5.0804443359375, 5.43115234375, 5.7818603515625, 6.132568359375, 6.4832763671875, 6.833984375, 7.1846923828125, 7.535400390625, 7.8861083984375, 8.23681640625, 8.5875244140625, 8.938232421875, 9.2889404296875, 9.6396484375, 9.9903564453125, 10.341064453125, 10.6917724609375, 11.04248046875, 11.3931884765625, 11.743896484375, 12.0946044921875, 12.4453125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 14.0, 25.0, 36.0, 64.0, 151.0, 210.0, 245.0, 127.0, 56.0, 27.0, 19.0, 10.0, 4.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.55964660644531, -78.99602508544922, -76.43240356445312, -73.86878204345703, -71.30516052246094, -68.74153900146484, -66.17791748046875, -63.614295959472656, -61.05067443847656, -58.48705291748047, -55.923431396484375, -53.35980987548828, -50.79618835449219, -48.232566833496094, -45.6689453125, -43.105323791503906, -40.54170227050781, -37.97808074951172, -35.414459228515625, -32.85083770751953, -30.287216186523438, -27.723594665527344, -25.15997314453125, -22.596351623535156, -20.032730102539062, -17.46910858154297, -14.905487060546875, -12.341865539550781, -9.778244018554688, -7.214622497558594, -4.6510009765625, -2.0873794555664062, 0.47624969482421875, 3.0398712158203125, 5.603492736816406, 8.1671142578125, 10.730735778808594, 13.294357299804688, 15.857978820800781, 18.421600341796875, 20.98522186279297, 23.548843383789062, 26.112464904785156, 28.67608642578125, 31.239707946777344, 33.80332946777344, 36.36695098876953, 38.930572509765625, 41.49419403076172, 44.05781555175781, 46.621437072753906, 49.18505859375, 51.748680114746094, 54.31230163574219, 56.87592315673828, 59.439544677734375, 62.00316619873047, 64.56678771972656, 67.13040924072266, 69.69403076171875, 72.25765228271484, 74.82127380371094, 77.38489532470703, 79.94851684570312, 82.51213836669922]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 3.0, 8.0, 9.0, 6.0, 9.0, 6.0, 7.0, 23.0, 25.0, 27.0, 33.0, 52.0, 42.0, 40.0, 46.0, 49.0, 47.0, 65.0, 53.0, 58.0, 59.0, 40.0, 40.0, 28.0, 38.0, 31.0, 36.0, 18.0, 21.0, 23.0, 13.0, 14.0, 8.0, 6.0, 11.0, 4.0, 0.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.01647186279297, -37.75933074951172, -36.50218963623047, -35.24504852294922, -33.98790740966797, -32.73076248168945, -31.473621368408203, -30.216480255126953, -28.959339141845703, -27.702198028564453, -26.445056915283203, -25.18791389465332, -23.93077278137207, -22.67363166809082, -21.416488647460938, -20.159347534179688, -18.902206420898438, -17.645065307617188, -16.387924194335938, -15.130781173706055, -13.873640060424805, -12.616498947143555, -11.359356880187988, -10.102214813232422, -8.845073699951172, -7.587932109832764, -6.3307905197143555, -5.073648929595947, -3.816507339477539, -2.559365749359131, -1.3022241592407227, -0.04508209228515625, 1.2120590209960938, 2.469200611114502, 3.72634220123291, 4.983483791351318, 6.240625381469727, 7.497766971588135, 8.754908561706543, 10.01205062866211, 11.26919174194336, 12.52633285522461, 13.783474922180176, 15.040616989135742, 16.297758102416992, 17.554899215698242, 18.812042236328125, 20.069183349609375, 21.326324462890625, 22.583465576171875, 23.840606689453125, 25.097749710083008, 26.354890823364258, 27.612031936645508, 28.86917495727539, 30.12631607055664, 31.38345718383789, 32.64059829711914, 33.89773941040039, 35.15488052368164, 36.412025451660156, 37.669166564941406, 38.926307678222656, 40.183448791503906, 41.440589904785156]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 10.0, 9.0, 25.0, 17.0, 27.0, 55.0, 90.0, 158.0, 269.0, 492.0, 933.0, 1815.0, 3759.0, 8812.0, 22060.0, 61622.0, 194614.0, 451179.0, 200331.0, 62983.0, 22635.0, 8947.0, 3853.0, 1811.0, 911.0, 481.0, 245.0, 154.0, 86.0, 64.0, 41.0, 20.0, 13.0, 9.0, 11.0, 7.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-7.16796875, -6.99102783203125, -6.8140869140625, -6.63714599609375, -6.460205078125, -6.28326416015625, -6.1063232421875, -5.92938232421875, -5.75244140625, -5.57550048828125, -5.3985595703125, -5.22161865234375, -5.044677734375, -4.86773681640625, -4.6907958984375, -4.51385498046875, -4.3369140625, -4.15997314453125, -3.9830322265625, -3.80609130859375, -3.629150390625, -3.45220947265625, -3.2752685546875, -3.09832763671875, -2.92138671875, -2.74444580078125, -2.5675048828125, -2.39056396484375, -2.213623046875, -2.03668212890625, -1.8597412109375, -1.68280029296875, -1.505859375, -1.32891845703125, -1.1519775390625, -0.97503662109375, -0.798095703125, -0.62115478515625, -0.4442138671875, -0.26727294921875, -0.09033203125, 0.08660888671875, 0.2635498046875, 0.44049072265625, 0.617431640625, 0.79437255859375, 0.9713134765625, 1.14825439453125, 1.3251953125, 1.50213623046875, 1.6790771484375, 1.85601806640625, 2.032958984375, 2.20989990234375, 2.3868408203125, 2.56378173828125, 2.74072265625, 2.91766357421875, 3.0946044921875, 3.27154541015625, 3.448486328125, 3.62542724609375, 3.8023681640625, 3.97930908203125, 4.15625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 2.0, 9.0, 8.0, 11.0, 11.0, 27.0, 35.0, 42.0, 60.0, 61.0, 66.0, 84.0, 89.0, 99.0, 67.0, 71.0, 66.0, 45.0, 42.0, 26.0, 25.0, 10.0, 18.0, 12.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.298828125, -3.155426025390625, -3.01202392578125, -2.868621826171875, -2.7252197265625, -2.581817626953125, -2.43841552734375, -2.295013427734375, -2.151611328125, -2.008209228515625, -1.86480712890625, -1.721405029296875, -1.5780029296875, -1.434600830078125, -1.29119873046875, -1.147796630859375, -1.00439453125, -0.860992431640625, -0.71759033203125, -0.574188232421875, -0.4307861328125, -0.287384033203125, -0.14398193359375, -0.000579833984375, 0.142822265625, 0.286224365234375, 0.42962646484375, 0.573028564453125, 0.7164306640625, 0.859832763671875, 1.00323486328125, 1.146636962890625, 1.2900390625, 1.433441162109375, 1.57684326171875, 1.720245361328125, 1.8636474609375, 2.007049560546875, 2.15045166015625, 2.293853759765625, 2.437255859375, 2.580657958984375, 2.72406005859375, 2.867462158203125, 3.0108642578125, 3.154266357421875, 3.29766845703125, 3.441070556640625, 3.58447265625, 3.727874755859375, 3.87127685546875, 4.014678955078125, 4.1580810546875, 4.301483154296875, 4.44488525390625, 4.588287353515625, 4.731689453125, 4.875091552734375, 5.01849365234375, 5.161895751953125, 5.3052978515625, 5.448699951171875, 5.59210205078125, 5.735504150390625, 5.87890625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 15.0, 12.0, 23.0, 41.0, 62.0, 94.0, 152.0, 307.0, 578.0, 1176.0, 2805.0, 10021.0, 57741.0, 663540.0, 272958.0, 28877.0, 6219.0, 1990.0, 875.0, 420.0, 247.0, 140.0, 87.0, 44.0, 42.0, 19.0, 17.0, 11.0, 13.0, 5.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.3828125, -10.03466796875, -9.6865234375, -9.33837890625, -8.990234375, -8.64208984375, -8.2939453125, -7.94580078125, -7.59765625, -7.24951171875, -6.9013671875, -6.55322265625, -6.205078125, -5.85693359375, -5.5087890625, -5.16064453125, -4.8125, -4.46435546875, -4.1162109375, -3.76806640625, -3.419921875, -3.07177734375, -2.7236328125, -2.37548828125, -2.02734375, -1.67919921875, -1.3310546875, -0.98291015625, -0.634765625, -0.28662109375, 0.0615234375, 0.40966796875, 0.7578125, 1.10595703125, 1.4541015625, 1.80224609375, 2.150390625, 2.49853515625, 2.8466796875, 3.19482421875, 3.54296875, 3.89111328125, 4.2392578125, 4.58740234375, 4.935546875, 5.28369140625, 5.6318359375, 5.97998046875, 6.328125, 6.67626953125, 7.0244140625, 7.37255859375, 7.720703125, 8.06884765625, 8.4169921875, 8.76513671875, 9.11328125, 9.46142578125, 9.8095703125, 10.15771484375, 10.505859375, 10.85400390625, 11.2021484375, 11.55029296875, 11.8984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 10.0, 7.0, 6.0, 9.0, 13.0, 12.0, 15.0, 24.0, 23.0, 19.0, 50.0, 37.0, 42.0, 43.0, 41.0, 50.0, 65.0, 52.0, 54.0, 54.0, 49.0, 51.0, 52.0, 43.0, 31.0, 33.0, 30.0, 22.0, 13.0, 14.0, 10.0, 8.0, 7.0, 7.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.09375, -12.6490478515625, -12.204345703125, -11.7596435546875, -11.31494140625, -10.8702392578125, -10.425537109375, -9.9808349609375, -9.5361328125, -9.0914306640625, -8.646728515625, -8.2020263671875, -7.75732421875, -7.3126220703125, -6.867919921875, -6.4232177734375, -5.978515625, -5.5338134765625, -5.089111328125, -4.6444091796875, -4.19970703125, -3.7550048828125, -3.310302734375, -2.8656005859375, -2.4208984375, -1.9761962890625, -1.531494140625, -1.0867919921875, -0.64208984375, -0.1973876953125, 0.247314453125, 0.6920166015625, 1.13671875, 1.5814208984375, 2.026123046875, 2.4708251953125, 2.91552734375, 3.3602294921875, 3.804931640625, 4.2496337890625, 4.6943359375, 5.1390380859375, 5.583740234375, 6.0284423828125, 6.47314453125, 6.9178466796875, 7.362548828125, 7.8072509765625, 8.251953125, 8.6966552734375, 9.141357421875, 9.5860595703125, 10.03076171875, 10.4754638671875, 10.920166015625, 11.3648681640625, 11.8095703125, 12.2542724609375, 12.698974609375, 13.1436767578125, 13.58837890625, 14.0330810546875, 14.477783203125, 14.9224853515625, 15.3671875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 3.0, 4.0, 6.0, 4.0, 6.0, 7.0, 14.0, 5.0, 17.0, 28.0, 28.0, 58.0, 69.0, 130.0, 272.0, 512.0, 1389.0, 5121.0, 56429.0, 939050.0, 38789.0, 4243.0, 1273.0, 495.0, 216.0, 131.0, 69.0, 56.0, 27.0, 29.0, 20.0, 13.0, 10.0, 7.0, 7.0, 9.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-6.328125, -6.11322021484375, -5.8983154296875, -5.68341064453125, -5.468505859375, -5.25360107421875, -5.0386962890625, -4.82379150390625, -4.60888671875, -4.39398193359375, -4.1790771484375, -3.96417236328125, -3.749267578125, -3.53436279296875, -3.3194580078125, -3.10455322265625, -2.8896484375, -2.67474365234375, -2.4598388671875, -2.24493408203125, -2.030029296875, -1.81512451171875, -1.6002197265625, -1.38531494140625, -1.17041015625, -0.95550537109375, -0.7406005859375, -0.52569580078125, -0.310791015625, -0.09588623046875, 0.1190185546875, 0.33392333984375, 0.548828125, 0.76373291015625, 0.9786376953125, 1.19354248046875, 1.408447265625, 1.62335205078125, 1.8382568359375, 2.05316162109375, 2.26806640625, 2.48297119140625, 2.6978759765625, 2.91278076171875, 3.127685546875, 3.34259033203125, 3.5574951171875, 3.77239990234375, 3.9873046875, 4.20220947265625, 4.4171142578125, 4.63201904296875, 4.846923828125, 5.06182861328125, 5.2767333984375, 5.49163818359375, 5.70654296875, 5.92144775390625, 6.1363525390625, 6.35125732421875, 6.566162109375, 6.78106689453125, 6.9959716796875, 7.21087646484375, 7.42578125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 7.0, 12.0, 8.0, 12.0, 18.0, 39.0, 69.0, 115.0, 183.0, 186.0, 130.0, 94.0, 57.0, 29.0, 14.0, 6.0, 6.0, 3.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001522064208984375, -0.0014868155121803284, -0.0014515668153762817, -0.001416318118572235, -0.0013810694217681885, -0.0013458207249641418, -0.0013105720281600952, -0.0012753233313560486, -0.001240074634552002, -0.0012048259377479553, -0.0011695772409439087, -0.001134328544139862, -0.0010990798473358154, -0.0010638311505317688, -0.0010285824537277222, -0.0009933337569236755, -0.0009580850601196289, -0.0009228363633155823, -0.0008875876665115356, -0.000852338969707489, -0.0008170902729034424, -0.0007818415760993958, -0.0007465928792953491, -0.0007113441824913025, -0.0006760954856872559, -0.0006408467888832092, -0.0006055980920791626, -0.000570349395275116, -0.0005351006984710693, -0.0004998520016670227, -0.0004646033048629761, -0.00042935460805892944, -0.0003941059112548828, -0.0003588572144508362, -0.00032360851764678955, -0.0002883598208427429, -0.0002531111240386963, -0.00021786242723464966, -0.00018261373043060303, -0.0001473650336265564, -0.00011211633682250977, -7.686764001846313e-05, -4.1618943214416504e-05, -6.370246410369873e-06, 2.8878450393676758e-05, 6.412714719772339e-05, 9.937584400177002e-05, 0.00013462454080581665, 0.00016987323760986328, 0.0002051219344139099, 0.00024037063121795654, 0.0002756193280220032, 0.0003108680248260498, 0.00034611672163009644, 0.00038136541843414307, 0.0004166141152381897, 0.00045186281204223633, 0.00048711150884628296, 0.0005223602056503296, 0.0005576089024543762, 0.0005928575992584229, 0.0006281062960624695, 0.0006633549928665161, 0.0006986036896705627, 0.0007338523864746094]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 3.0, 8.0, 15.0, 22.0, 37.0, 42.0, 57.0, 134.0, 217.0, 456.0, 1111.0, 3576.0, 14919.0, 153741.0, 810456.0, 51870.0, 8024.0, 2176.0, 872.0, 367.0, 185.0, 93.0, 58.0, 38.0, 18.0, 16.0, 11.0, 1.0, 6.0, 7.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.51171875, -5.363983154296875, -5.21624755859375, -5.068511962890625, -4.9207763671875, -4.773040771484375, -4.62530517578125, -4.477569580078125, -4.329833984375, -4.182098388671875, -4.03436279296875, -3.886627197265625, -3.7388916015625, -3.591156005859375, -3.44342041015625, -3.295684814453125, -3.14794921875, -3.000213623046875, -2.85247802734375, -2.704742431640625, -2.5570068359375, -2.409271240234375, -2.26153564453125, -2.113800048828125, -1.966064453125, -1.818328857421875, -1.67059326171875, -1.522857666015625, -1.3751220703125, -1.227386474609375, -1.07965087890625, -0.931915283203125, -0.7841796875, -0.636444091796875, -0.48870849609375, -0.340972900390625, -0.1932373046875, -0.045501708984375, 0.10223388671875, 0.249969482421875, 0.397705078125, 0.545440673828125, 0.69317626953125, 0.840911865234375, 0.9886474609375, 1.136383056640625, 1.28411865234375, 1.431854248046875, 1.57958984375, 1.727325439453125, 1.87506103515625, 2.022796630859375, 2.1705322265625, 2.318267822265625, 2.46600341796875, 2.613739013671875, 2.761474609375, 2.909210205078125, 3.05694580078125, 3.204681396484375, 3.3524169921875, 3.500152587890625, 3.64788818359375, 3.795623779296875, 3.943359375]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 10.0, 3.0, 13.0, 10.0, 11.0, 12.0, 30.0, 36.0, 51.0, 58.0, 69.0, 85.0, 95.0, 115.0, 74.0, 80.0, 61.0, 35.0, 41.0, 17.0, 22.0, 12.0, 10.0, 12.0, 7.0, 9.0, 5.0, 2.0, 4.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-4.9375, -4.80828857421875, -4.6790771484375, -4.54986572265625, -4.420654296875, -4.29144287109375, -4.1622314453125, -4.03302001953125, -3.90380859375, -3.77459716796875, -3.6453857421875, -3.51617431640625, -3.386962890625, -3.25775146484375, -3.1285400390625, -2.99932861328125, -2.8701171875, -2.74090576171875, -2.6116943359375, -2.48248291015625, -2.353271484375, -2.22406005859375, -2.0948486328125, -1.96563720703125, -1.83642578125, -1.70721435546875, -1.5780029296875, -1.44879150390625, -1.319580078125, -1.19036865234375, -1.0611572265625, -0.93194580078125, -0.802734375, -0.67352294921875, -0.5443115234375, -0.41510009765625, -0.285888671875, -0.15667724609375, -0.0274658203125, 0.10174560546875, 0.23095703125, 0.36016845703125, 0.4893798828125, 0.61859130859375, 0.747802734375, 0.87701416015625, 1.0062255859375, 1.13543701171875, 1.2646484375, 1.39385986328125, 1.5230712890625, 1.65228271484375, 1.781494140625, 1.91070556640625, 2.0399169921875, 2.16912841796875, 2.29833984375, 2.42755126953125, 2.5567626953125, 2.68597412109375, 2.815185546875, 2.94439697265625, 3.0736083984375, 3.20281982421875, 3.33203125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 3.0, 7.0, 13.0, 18.0, 34.0, 48.0, 83.0, 113.0, 166.0, 170.0, 139.0, 76.0, 49.0, 30.0, 17.0, 10.0, 6.0, 4.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-71.78399658203125, -69.66683959960938, -67.54967498779297, -65.4325180053711, -63.31535720825195, -61.19819641113281, -59.08103561401367, -56.96387481689453, -54.846717834472656, -52.729557037353516, -50.612396240234375, -48.4952392578125, -46.37807846069336, -44.26091766357422, -42.14375686645508, -40.02659606933594, -37.9094352722168, -35.792274475097656, -33.675113677978516, -31.557954788208008, -29.4407958984375, -27.32363510131836, -25.20647430419922, -23.089313507080078, -20.97215461730957, -18.85499382019043, -16.737834930419922, -14.620674133300781, -12.503514289855957, -10.386354446411133, -8.269193649291992, -6.152033805847168, -4.034873962402344, -1.9177138805389404, 0.1994462013244629, 2.3166065216064453, 4.4337663650512695, 6.550926208496094, 8.668087005615234, 10.785246849060059, 12.902406692504883, 15.019566535949707, 17.13672637939453, 19.253887176513672, 21.371047973632812, 23.48820686340332, 25.60536766052246, 27.72252655029297, 29.83968734741211, 31.95684814453125, 34.07400894165039, 36.19116973876953, 38.308326721191406, 40.42548751831055, 42.54264831542969, 44.65980911254883, 46.77696990966797, 48.89413070678711, 51.01129150390625, 53.128448486328125, 55.245609283447266, 57.362770080566406, 59.47993087768555, 61.59709167480469, 63.71424865722656]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 6.0, 6.0, 19.0, 11.0, 12.0, 20.0, 30.0, 35.0, 44.0, 56.0, 55.0, 69.0, 90.0, 82.0, 91.0, 76.0, 53.0, 42.0, 48.0, 38.0, 29.0, 24.0, 11.0, 11.0, 12.0, 9.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-94.86015319824219, -92.39710235595703, -89.93405151367188, -87.47100067138672, -85.00794982910156, -82.5448989868164, -80.08184814453125, -77.61880493164062, -75.15574645996094, -72.69269561767578, -70.22964477539062, -67.76659393310547, -65.30354309082031, -62.840492248535156, -60.377445220947266, -57.91439437866211, -55.45134735107422, -52.98829650878906, -50.525245666503906, -48.06219482421875, -45.599143981933594, -43.13609313964844, -40.67304611206055, -38.20999526977539, -35.746944427490234, -33.28389358520508, -30.820842742919922, -28.3577938079834, -25.894742965698242, -23.431692123413086, -20.968643188476562, -18.505592346191406, -16.04254150390625, -13.579490661621094, -11.116440773010254, -8.653390884399414, -6.190340042114258, -3.7272891998291016, -1.2642393112182617, 1.1988105773925781, 3.6618614196777344, 6.124911785125732, 8.58796215057373, 11.05101203918457, 13.514062881469727, 15.977113723754883, 18.440162658691406, 20.903213500976562, 23.36626434326172, 25.829315185546875, 28.29236602783203, 30.755414962768555, 33.218467712402344, 35.6815185546875, 38.14456558227539, 40.60761642456055, 43.0706672668457, 45.53371810913086, 47.996768951416016, 50.45981979370117, 52.92286682128906, 55.38591766357422, 57.848968505859375, 60.31201934814453, 62.77507019042969]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 3.0, 4.0, 6.0, 8.0, 6.0, 8.0, 11.0, 20.0, 20.0, 21.0, 33.0, 55.0, 65.0, 117.0, 229.0, 549.0, 1830.0, 7170.0, 44744.0, 3746750.0, 371394.0, 15495.0, 3297.0, 1097.0, 509.0, 275.0, 167.0, 95.0, 79.0, 68.0, 35.0, 24.0, 30.0, 20.0, 16.0, 14.0, 9.0, 2.0, 1.0, 3.0, 5.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.546875, -10.2252197265625, -9.903564453125, -9.5819091796875, -9.26025390625, -8.9385986328125, -8.616943359375, -8.2952880859375, -7.9736328125, -7.6519775390625, -7.330322265625, -7.0086669921875, -6.68701171875, -6.3653564453125, -6.043701171875, -5.7220458984375, -5.400390625, -5.0787353515625, -4.757080078125, -4.4354248046875, -4.11376953125, -3.7921142578125, -3.470458984375, -3.1488037109375, -2.8271484375, -2.5054931640625, -2.183837890625, -1.8621826171875, -1.54052734375, -1.2188720703125, -0.897216796875, -0.5755615234375, -0.25390625, 0.0677490234375, 0.389404296875, 0.7110595703125, 1.03271484375, 1.3543701171875, 1.676025390625, 1.9976806640625, 2.3193359375, 2.6409912109375, 2.962646484375, 3.2843017578125, 3.60595703125, 3.9276123046875, 4.249267578125, 4.5709228515625, 4.892578125, 5.2142333984375, 5.535888671875, 5.8575439453125, 6.17919921875, 6.5008544921875, 6.822509765625, 7.1441650390625, 7.4658203125, 7.7874755859375, 8.109130859375, 8.4307861328125, 8.75244140625, 9.0740966796875, 9.395751953125, 9.7174072265625, 10.0390625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 23.0, 33.0, 50.0, 74.0, 98.0, 122.0, 133.0, 126.0, 104.0, 89.0, 38.0, 35.0, 30.0, 21.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.130859375, -2.920562744140625, -2.71026611328125, -2.499969482421875, -2.2896728515625, -2.079376220703125, -1.86907958984375, -1.658782958984375, -1.448486328125, -1.238189697265625, -1.02789306640625, -0.817596435546875, -0.6072998046875, -0.397003173828125, -0.18670654296875, 0.023590087890625, 0.23388671875, 0.444183349609375, 0.65447998046875, 0.864776611328125, 1.0750732421875, 1.285369873046875, 1.49566650390625, 1.705963134765625, 1.916259765625, 2.126556396484375, 2.33685302734375, 2.547149658203125, 2.7574462890625, 2.967742919921875, 3.17803955078125, 3.388336181640625, 3.5986328125, 3.808929443359375, 4.01922607421875, 4.229522705078125, 4.4398193359375, 4.650115966796875, 4.86041259765625, 5.070709228515625, 5.281005859375, 5.491302490234375, 5.70159912109375, 5.911895751953125, 6.1221923828125, 6.332489013671875, 6.54278564453125, 6.753082275390625, 6.96337890625, 7.173675537109375, 7.38397216796875, 7.594268798828125, 7.8045654296875, 8.014862060546875, 8.22515869140625, 8.435455322265625, 8.645751953125, 8.856048583984375, 9.06634521484375, 9.276641845703125, 9.4869384765625, 9.697235107421875, 9.90753173828125, 10.117828369140625, 10.328125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 4.0, 4.0, 9.0, 3.0, 17.0, 14.0, 32.0, 55.0, 78.0, 125.0, 179.0, 360.0, 685.0, 1649.0, 4586.0, 17940.0, 143589.0, 3888579.0, 113834.0, 15885.0, 4059.0, 1384.0, 604.0, 273.0, 143.0, 83.0, 42.0, 28.0, 18.0, 9.0, 6.0, 7.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-14.078125, -13.73858642578125, -13.3990478515625, -13.05950927734375, -12.719970703125, -12.38043212890625, -12.0408935546875, -11.70135498046875, -11.36181640625, -11.02227783203125, -10.6827392578125, -10.34320068359375, -10.003662109375, -9.66412353515625, -9.3245849609375, -8.98504638671875, -8.6455078125, -8.30596923828125, -7.9664306640625, -7.62689208984375, -7.287353515625, -6.94781494140625, -6.6082763671875, -6.26873779296875, -5.92919921875, -5.58966064453125, -5.2501220703125, -4.91058349609375, -4.571044921875, -4.23150634765625, -3.8919677734375, -3.55242919921875, -3.212890625, -2.87335205078125, -2.5338134765625, -2.19427490234375, -1.854736328125, -1.51519775390625, -1.1756591796875, -0.83612060546875, -0.49658203125, -0.15704345703125, 0.1824951171875, 0.52203369140625, 0.861572265625, 1.20111083984375, 1.5406494140625, 1.88018798828125, 2.2197265625, 2.55926513671875, 2.8988037109375, 3.23834228515625, 3.577880859375, 3.91741943359375, 4.2569580078125, 4.59649658203125, 4.93603515625, 5.27557373046875, 5.6151123046875, 5.95465087890625, 6.294189453125, 6.63372802734375, 6.9732666015625, 7.31280517578125, 7.65234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 4.0, 7.0, 10.0, 12.0, 15.0, 34.0, 44.0, 95.0, 229.0, 891.0, 1835.0, 569.0, 144.0, 57.0, 45.0, 21.0, 20.0, 13.0, 11.0, 4.0, 4.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.5625, -16.197265625, -15.83203125, -15.466796875, -15.1015625, -14.736328125, -14.37109375, -14.005859375, -13.640625, -13.275390625, -12.91015625, -12.544921875, -12.1796875, -11.814453125, -11.44921875, -11.083984375, -10.71875, -10.353515625, -9.98828125, -9.623046875, -9.2578125, -8.892578125, -8.52734375, -8.162109375, -7.796875, -7.431640625, -7.06640625, -6.701171875, -6.3359375, -5.970703125, -5.60546875, -5.240234375, -4.875, -4.509765625, -4.14453125, -3.779296875, -3.4140625, -3.048828125, -2.68359375, -2.318359375, -1.953125, -1.587890625, -1.22265625, -0.857421875, -0.4921875, -0.126953125, 0.23828125, 0.603515625, 0.96875, 1.333984375, 1.69921875, 2.064453125, 2.4296875, 2.794921875, 3.16015625, 3.525390625, 3.890625, 4.255859375, 4.62109375, 4.986328125, 5.3515625, 5.716796875, 6.08203125, 6.447265625, 6.8125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 16.0, 44.0, 157.0, 370.0, 259.0, 96.0, 35.0, 12.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.74002838134766, -87.0778579711914, -83.41568756103516, -79.7535171508789, -76.09133911132812, -72.42916870117188, -68.76699829101562, -65.10482788085938, -61.442657470703125, -57.780487060546875, -54.118316650390625, -50.45614242553711, -46.79397201538086, -43.13180160522461, -39.469627380371094, -35.807456970214844, -32.145286560058594, -28.483116149902344, -24.82094383239746, -21.158771514892578, -17.496601104736328, -13.834430694580078, -10.172258377075195, -6.5100860595703125, -2.8479156494140625, 0.8142557144165039, 4.47642707824707, 8.138598442077637, 11.800769805908203, 15.462940216064453, 19.125112533569336, 22.78728485107422, 26.449462890625, 30.11163330078125, 33.7738037109375, 37.435977935791016, 41.098148345947266, 44.760318756103516, 48.42249298095703, 52.08466339111328, 55.74683380126953, 59.40900421142578, 63.07117462158203, 66.73334503173828, 70.39552307128906, 74.05769348144531, 77.71986389160156, 81.38203430175781, 85.04420471191406, 88.70637512207031, 92.36854553222656, 96.03071594238281, 99.69288635253906, 103.35505676269531, 107.0172348022461, 110.67940521240234, 114.3415756225586, 118.00374603271484, 121.6659164428711, 125.32808685302734, 128.99026489257812, 132.65243530273438, 136.31460571289062, 139.97677612304688, 143.63894653320312]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 6.0, 7.0, 8.0, 10.0, 13.0, 20.0, 29.0, 27.0, 29.0, 59.0, 46.0, 57.0, 63.0, 66.0, 65.0, 71.0, 61.0, 69.0, 57.0, 53.0, 46.0, 33.0, 28.0, 28.0, 20.0, 11.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0], "bins": [-70.87564086914062, -69.24797058105469, -67.62030029296875, -65.99263000488281, -64.36495971679688, -62.73728942871094, -61.109619140625, -59.48194885253906, -57.854278564453125, -56.22660827636719, -54.59893798828125, -52.97126770019531, -51.343597412109375, -49.71592712402344, -48.0882568359375, -46.46058654785156, -44.832916259765625, -43.20524597167969, -41.57757568359375, -39.94990539550781, -38.322235107421875, -36.69456481933594, -35.06689453125, -33.43922424316406, -31.81155776977539, -30.183887481689453, -28.556217193603516, -26.928546905517578, -25.30087661743164, -23.673206329345703, -22.045536041259766, -20.417865753173828, -18.79019546508789, -17.162525177001953, -15.534854888916016, -13.907184600830078, -12.27951431274414, -10.65184497833252, -9.024174690246582, -7.3965044021606445, -5.768834114074707, -4.1411638259887695, -2.513493776321411, -0.8858237266540527, 0.7418465614318848, 2.369516372680664, 3.9971866607666016, 5.624856948852539, 7.252527236938477, 8.880197525024414, 10.507867813110352, 12.135538101196289, 13.763208389282227, 15.390877723693848, 17.01854705810547, 18.646217346191406, 20.273887634277344, 21.90155792236328, 23.52922821044922, 25.156898498535156, 26.784568786621094, 28.41223907470703, 30.03990936279297, 31.667579650878906, 33.295249938964844]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 3.0, 4.0, 10.0, 15.0, 20.0, 29.0, 64.0, 85.0, 144.0, 263.0, 509.0, 1053.0, 2173.0, 5587.0, 14529.0, 42630.0, 145543.0, 482679.0, 249291.0, 67897.0, 22099.0, 7796.0, 3239.0, 1423.0, 620.0, 347.0, 205.0, 113.0, 62.0, 54.0, 30.0, 16.0, 9.0, 8.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.640625, -7.44317626953125, -7.2457275390625, -7.04827880859375, -6.850830078125, -6.65338134765625, -6.4559326171875, -6.25848388671875, -6.06103515625, -5.86358642578125, -5.6661376953125, -5.46868896484375, -5.271240234375, -5.07379150390625, -4.8763427734375, -4.67889404296875, -4.4814453125, -4.28399658203125, -4.0865478515625, -3.88909912109375, -3.691650390625, -3.49420166015625, -3.2967529296875, -3.09930419921875, -2.90185546875, -2.70440673828125, -2.5069580078125, -2.30950927734375, -2.112060546875, -1.91461181640625, -1.7171630859375, -1.51971435546875, -1.322265625, -1.12481689453125, -0.9273681640625, -0.72991943359375, -0.532470703125, -0.33502197265625, -0.1375732421875, 0.05987548828125, 0.25732421875, 0.45477294921875, 0.6522216796875, 0.84967041015625, 1.047119140625, 1.24456787109375, 1.4420166015625, 1.63946533203125, 1.8369140625, 2.03436279296875, 2.2318115234375, 2.42926025390625, 2.626708984375, 2.82415771484375, 3.0216064453125, 3.21905517578125, 3.41650390625, 3.61395263671875, 3.8114013671875, 4.00885009765625, 4.206298828125, 4.40374755859375, 4.6011962890625, 4.79864501953125, 4.99609375]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 8.0, 7.0, 11.0, 11.0, 12.0, 26.0, 27.0, 49.0, 73.0, 62.0, 88.0, 85.0, 76.0, 90.0, 59.0, 64.0, 59.0, 42.0, 36.0, 35.0, 23.0, 15.0, 19.0, 8.0, 10.0, 3.0, 9.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.48828125, -3.34210205078125, -3.1959228515625, -3.04974365234375, -2.903564453125, -2.75738525390625, -2.6112060546875, -2.46502685546875, -2.31884765625, -2.17266845703125, -2.0264892578125, -1.88031005859375, -1.734130859375, -1.58795166015625, -1.4417724609375, -1.29559326171875, -1.1494140625, -1.00323486328125, -0.8570556640625, -0.71087646484375, -0.564697265625, -0.41851806640625, -0.2723388671875, -0.12615966796875, 0.02001953125, 0.16619873046875, 0.3123779296875, 0.45855712890625, 0.604736328125, 0.75091552734375, 0.8970947265625, 1.04327392578125, 1.189453125, 1.33563232421875, 1.4818115234375, 1.62799072265625, 1.774169921875, 1.92034912109375, 2.0665283203125, 2.21270751953125, 2.35888671875, 2.50506591796875, 2.6512451171875, 2.79742431640625, 2.943603515625, 3.08978271484375, 3.2359619140625, 3.38214111328125, 3.5283203125, 3.67449951171875, 3.8206787109375, 3.96685791015625, 4.113037109375, 4.25921630859375, 4.4053955078125, 4.55157470703125, 4.69775390625, 4.84393310546875, 4.9901123046875, 5.13629150390625, 5.282470703125, 5.42864990234375, 5.5748291015625, 5.72100830078125, 5.8671875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 6.0, 10.0, 12.0, 18.0, 16.0, 21.0, 34.0, 48.0, 61.0, 99.0, 157.0, 297.0, 537.0, 931.0, 2022.0, 5258.0, 18246.0, 97792.0, 698000.0, 183541.0, 28832.0, 7199.0, 2621.0, 1179.0, 607.0, 344.0, 201.0, 136.0, 97.0, 70.0, 43.0, 32.0, 26.0, 16.0, 15.0, 8.0, 6.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-11.125, -10.803955078125, -10.48291015625, -10.161865234375, -9.8408203125, -9.519775390625, -9.19873046875, -8.877685546875, -8.556640625, -8.235595703125, -7.91455078125, -7.593505859375, -7.2724609375, -6.951416015625, -6.63037109375, -6.309326171875, -5.98828125, -5.667236328125, -5.34619140625, -5.025146484375, -4.7041015625, -4.383056640625, -4.06201171875, -3.740966796875, -3.419921875, -3.098876953125, -2.77783203125, -2.456787109375, -2.1357421875, -1.814697265625, -1.49365234375, -1.172607421875, -0.8515625, -0.530517578125, -0.20947265625, 0.111572265625, 0.4326171875, 0.753662109375, 1.07470703125, 1.395751953125, 1.716796875, 2.037841796875, 2.35888671875, 2.679931640625, 3.0009765625, 3.322021484375, 3.64306640625, 3.964111328125, 4.28515625, 4.606201171875, 4.92724609375, 5.248291015625, 5.5693359375, 5.890380859375, 6.21142578125, 6.532470703125, 6.853515625, 7.174560546875, 7.49560546875, 7.816650390625, 8.1376953125, 8.458740234375, 8.77978515625, 9.100830078125, 9.421875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 2.0, 10.0, 4.0, 10.0, 15.0, 16.0, 20.0, 34.0, 20.0, 43.0, 42.0, 51.0, 51.0, 60.0, 65.0, 64.0, 66.0, 54.0, 79.0, 57.0, 41.0, 34.0, 34.0, 22.0, 30.0, 16.0, 13.0, 12.0, 8.0, 8.0, 6.0, 7.0, 2.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.171875, -16.660400390625, -16.14892578125, -15.637451171875, -15.1259765625, -14.614501953125, -14.10302734375, -13.591552734375, -13.080078125, -12.568603515625, -12.05712890625, -11.545654296875, -11.0341796875, -10.522705078125, -10.01123046875, -9.499755859375, -8.98828125, -8.476806640625, -7.96533203125, -7.453857421875, -6.9423828125, -6.430908203125, -5.91943359375, -5.407958984375, -4.896484375, -4.385009765625, -3.87353515625, -3.362060546875, -2.8505859375, -2.339111328125, -1.82763671875, -1.316162109375, -0.8046875, -0.293212890625, 0.21826171875, 0.729736328125, 1.2412109375, 1.752685546875, 2.26416015625, 2.775634765625, 3.287109375, 3.798583984375, 4.31005859375, 4.821533203125, 5.3330078125, 5.844482421875, 6.35595703125, 6.867431640625, 7.37890625, 7.890380859375, 8.40185546875, 8.913330078125, 9.4248046875, 9.936279296875, 10.44775390625, 10.959228515625, 11.470703125, 11.982177734375, 12.49365234375, 13.005126953125, 13.5166015625, 14.028076171875, 14.53955078125, 15.051025390625, 15.5625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 4.0, 8.0, 12.0, 24.0, 41.0, 60.0, 175.0, 378.0, 1417.0, 9585.0, 377334.0, 644308.0, 12805.0, 1625.0, 444.0, 147.0, 72.0, 36.0, 22.0, 8.0, 9.0, 13.0, 2.0, 4.0, 4.0, 3.0, 5.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.37890625, -7.148681640625, -6.91845703125, -6.688232421875, -6.4580078125, -6.227783203125, -5.99755859375, -5.767333984375, -5.537109375, -5.306884765625, -5.07666015625, -4.846435546875, -4.6162109375, -4.385986328125, -4.15576171875, -3.925537109375, -3.6953125, -3.465087890625, -3.23486328125, -3.004638671875, -2.7744140625, -2.544189453125, -2.31396484375, -2.083740234375, -1.853515625, -1.623291015625, -1.39306640625, -1.162841796875, -0.9326171875, -0.702392578125, -0.47216796875, -0.241943359375, -0.01171875, 0.218505859375, 0.44873046875, 0.678955078125, 0.9091796875, 1.139404296875, 1.36962890625, 1.599853515625, 1.830078125, 2.060302734375, 2.29052734375, 2.520751953125, 2.7509765625, 2.981201171875, 3.21142578125, 3.441650390625, 3.671875, 3.902099609375, 4.13232421875, 4.362548828125, 4.5927734375, 4.822998046875, 5.05322265625, 5.283447265625, 5.513671875, 5.743896484375, 5.97412109375, 6.204345703125, 6.4345703125, 6.664794921875, 6.89501953125, 7.125244140625, 7.35546875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 13.0, 21.0, 18.0, 36.0, 53.0, 79.0, 106.0, 137.0, 153.0, 125.0, 89.0, 68.0, 33.0, 18.0, 14.0, 11.0, 8.0, 3.0, 6.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012035369873046875, -0.001172766089439392, -0.0011419951915740967, -0.0011112242937088013, -0.0010804533958435059, -0.0010496824979782104, -0.001018911600112915, -0.0009881407022476196, -0.0009573698043823242, -0.0009265989065170288, -0.0008958280086517334, -0.000865057110786438, -0.0008342862129211426, -0.0008035153150558472, -0.0007727444171905518, -0.0007419735193252563, -0.0007112026214599609, -0.0006804317235946655, -0.0006496608257293701, -0.0006188899278640747, -0.0005881190299987793, -0.0005573481321334839, -0.0005265772342681885, -0.0004958063364028931, -0.00046503543853759766, -0.00043426454067230225, -0.00040349364280700684, -0.0003727227449417114, -0.000341951847076416, -0.0003111809492111206, -0.0002804100513458252, -0.0002496391534805298, -0.00021886825561523438, -0.00018809735774993896, -0.00015732645988464355, -0.00012655556201934814, -9.578466415405273e-05, -6.501376628875732e-05, -3.4242868423461914e-05, -3.471970558166504e-06, 2.7298927307128906e-05, 5.8069825172424316e-05, 8.884072303771973e-05, 0.00011961162090301514, 0.00015038251876831055, 0.00018115341663360596, 0.00021192431449890137, 0.00024269521236419678, 0.0002734661102294922, 0.0003042370080947876, 0.000335007905960083, 0.0003657788038253784, 0.00039654970169067383, 0.00042732059955596924, 0.00045809149742126465, 0.0004888623952865601, 0.0005196332931518555, 0.0005504041910171509, 0.0005811750888824463, 0.0006119459867477417, 0.0006427168846130371, 0.0006734877824783325, 0.0007042586803436279, 0.0007350295782089233, 0.0007658004760742188]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 12.0, 20.0, 26.0, 49.0, 73.0, 147.0, 210.0, 451.0, 862.0, 2195.0, 7014.0, 43798.0, 651225.0, 309964.0, 24588.0, 4832.0, 1550.0, 713.0, 340.0, 168.0, 98.0, 68.0, 35.0, 32.0, 21.0, 18.0, 7.0, 7.0, 7.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.509765625, -3.379119873046875, -3.24847412109375, -3.117828369140625, -2.9871826171875, -2.856536865234375, -2.72589111328125, -2.595245361328125, -2.464599609375, -2.333953857421875, -2.20330810546875, -2.072662353515625, -1.9420166015625, -1.811370849609375, -1.68072509765625, -1.550079345703125, -1.41943359375, -1.288787841796875, -1.15814208984375, -1.027496337890625, -0.8968505859375, -0.766204833984375, -0.63555908203125, -0.504913330078125, -0.374267578125, -0.243621826171875, -0.11297607421875, 0.017669677734375, 0.1483154296875, 0.278961181640625, 0.40960693359375, 0.540252685546875, 0.6708984375, 0.801544189453125, 0.93218994140625, 1.062835693359375, 1.1934814453125, 1.324127197265625, 1.45477294921875, 1.585418701171875, 1.716064453125, 1.846710205078125, 1.97735595703125, 2.108001708984375, 2.2386474609375, 2.369293212890625, 2.49993896484375, 2.630584716796875, 2.76123046875, 2.891876220703125, 3.02252197265625, 3.153167724609375, 3.2838134765625, 3.414459228515625, 3.54510498046875, 3.675750732421875, 3.806396484375, 3.937042236328125, 4.06768798828125, 4.198333740234375, 4.3289794921875, 4.459625244140625, 4.59027099609375, 4.720916748046875, 4.8515625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 10.0, 12.0, 13.0, 20.0, 31.0, 52.0, 54.0, 80.0, 123.0, 123.0, 121.0, 104.0, 79.0, 60.0, 35.0, 29.0, 16.0, 14.0, 9.0, 4.0, 2.0, 6.0, 4.0, 4.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4765625, -3.3184814453125, -3.160400390625, -3.0023193359375, -2.84423828125, -2.6861572265625, -2.528076171875, -2.3699951171875, -2.2119140625, -2.0538330078125, -1.895751953125, -1.7376708984375, -1.57958984375, -1.4215087890625, -1.263427734375, -1.1053466796875, -0.947265625, -0.7891845703125, -0.631103515625, -0.4730224609375, -0.31494140625, -0.1568603515625, 0.001220703125, 0.1593017578125, 0.3173828125, 0.4754638671875, 0.633544921875, 0.7916259765625, 0.94970703125, 1.1077880859375, 1.265869140625, 1.4239501953125, 1.58203125, 1.7401123046875, 1.898193359375, 2.0562744140625, 2.21435546875, 2.3724365234375, 2.530517578125, 2.6885986328125, 2.8466796875, 3.0047607421875, 3.162841796875, 3.3209228515625, 3.47900390625, 3.6370849609375, 3.795166015625, 3.9532470703125, 4.111328125, 4.2694091796875, 4.427490234375, 4.5855712890625, 4.74365234375, 4.9017333984375, 5.059814453125, 5.2178955078125, 5.3759765625, 5.5340576171875, 5.692138671875, 5.8502197265625, 6.00830078125, 6.1663818359375, 6.324462890625, 6.4825439453125, 6.640625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 5.0, 8.0, 21.0, 43.0, 104.0, 184.0, 279.0, 177.0, 92.0, 48.0, 17.0, 9.0, 8.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.05712127685547, -64.08370971679688, -61.110294342041016, -58.13688278198242, -55.16346740722656, -52.19005584716797, -49.216644287109375, -46.24323272705078, -43.26981735229492, -40.29640579223633, -37.32299041748047, -34.349578857421875, -31.37616539001465, -28.402751922607422, -25.429340362548828, -22.4559268951416, -19.482513427734375, -16.50909996032715, -13.535687446594238, -10.562274932861328, -7.588861465454102, -4.615447998046875, -1.6420364379882812, 1.3313770294189453, 4.304790496826172, 7.27820348739624, 10.251616477966309, 13.225028991699219, 16.198442459106445, 19.171855926513672, 22.145267486572266, 25.118680953979492, 28.09210205078125, 31.065515518188477, 34.0389289855957, 37.0123405456543, 39.985755920410156, 42.95916748046875, 45.932579040527344, 48.90599060058594, 51.8794059753418, 54.85281753540039, 57.82623291015625, 60.799644470214844, 63.77305603027344, 66.74647521972656, 69.71987915039062, 72.69329833984375, 75.66670989990234, 78.64012145996094, 81.61353302001953, 84.58694458007812, 87.56036376953125, 90.53377532958984, 93.50718688964844, 96.48059844970703, 99.45401000976562, 102.42742156982422, 105.40083312988281, 108.37425231933594, 111.34766387939453, 114.32107543945312, 117.29448699951172, 120.26789855957031, 123.24131774902344]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 8.0, 9.0, 13.0, 24.0, 31.0, 56.0, 80.0, 81.0, 114.0, 148.0, 135.0, 79.0, 88.0, 35.0, 41.0, 27.0, 21.0, 6.0, 7.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.1026611328125, -99.24211883544922, -95.38158416748047, -91.52104187011719, -87.6604995727539, -83.79995727539062, -79.93942260742188, -76.0788803100586, -72.21833801269531, -68.35779571533203, -64.49726104736328, -60.63671875, -56.77617645263672, -52.9156379699707, -49.05509948730469, -45.194557189941406, -41.334022521972656, -37.47348403930664, -33.61294174194336, -29.752403259277344, -25.891862869262695, -22.031322479248047, -18.17078399658203, -14.310243606567383, -10.449703216552734, -6.589163303375244, -2.728623390197754, 1.1319160461425781, 4.992456436157227, 8.852996826171875, 12.71353530883789, 16.57407569885254, 20.434616088867188, 24.295156478881836, 28.155696868896484, 32.0162353515625, 35.87677764892578, 39.7373161315918, 43.59785461425781, 47.458396911621094, 51.31893539428711, 55.179473876953125, 59.040016174316406, 62.90055465698242, 66.76109313964844, 70.62163543701172, 74.482177734375, 78.34271240234375, 82.20325469970703, 86.06379699707031, 89.92433166503906, 93.78487396240234, 97.64541625976562, 101.50595092773438, 105.36649322509766, 109.22703552246094, 113.08757019042969, 116.94811248779297, 120.80864715576172, 124.669189453125, 128.52972412109375, 132.39027404785156, 136.2508087158203, 140.11134338378906, 143.97189331054688]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 26.0, 60.0, 150.0, 304.0, 497.0, 691.0, 1276.0, 2899.0, 12474.0, 145526.0, 3655831.0, 349895.0, 19652.0, 3425.0, 972.0, 262.0, 126.0, 47.0, 31.0, 23.0, 15.0, 11.0, 14.0, 10.0, 7.0, 9.0, 7.0, 10.0, 5.0, 3.0, 2.0, 4.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.328125, -4.0823974609375, -3.836669921875, -3.5909423828125, -3.34521484375, -3.0994873046875, -2.853759765625, -2.6080322265625, -2.3623046875, -2.1165771484375, -1.870849609375, -1.6251220703125, -1.37939453125, -1.1336669921875, -0.887939453125, -0.6422119140625, -0.396484375, -0.1507568359375, 0.094970703125, 0.3406982421875, 0.58642578125, 0.8321533203125, 1.077880859375, 1.3236083984375, 1.5693359375, 1.8150634765625, 2.060791015625, 2.3065185546875, 2.55224609375, 2.7979736328125, 3.043701171875, 3.2894287109375, 3.53515625, 3.7808837890625, 4.026611328125, 4.2723388671875, 4.51806640625, 4.7637939453125, 5.009521484375, 5.2552490234375, 5.5009765625, 5.7467041015625, 5.992431640625, 6.2381591796875, 6.48388671875, 6.7296142578125, 6.975341796875, 7.2210693359375, 7.466796875, 7.7125244140625, 7.958251953125, 8.2039794921875, 8.44970703125, 8.6954345703125, 8.941162109375, 9.1868896484375, 9.4326171875, 9.6783447265625, 9.924072265625, 10.1697998046875, 10.41552734375, 10.6612548828125, 10.906982421875, 11.1527099609375, 11.3984375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 21.0, 44.0, 84.0, 162.0, 203.0, 193.0, 142.0, 76.0, 51.0, 23.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.28515625, -3.92840576171875, -3.5716552734375, -3.21490478515625, -2.858154296875, -2.50140380859375, -2.1446533203125, -1.78790283203125, -1.43115234375, -1.07440185546875, -0.7176513671875, -0.36090087890625, -0.004150390625, 0.35260009765625, 0.7093505859375, 1.06610107421875, 1.4228515625, 1.77960205078125, 2.1363525390625, 2.49310302734375, 2.849853515625, 3.20660400390625, 3.5633544921875, 3.92010498046875, 4.27685546875, 4.63360595703125, 4.9903564453125, 5.34710693359375, 5.703857421875, 6.06060791015625, 6.4173583984375, 6.77410888671875, 7.130859375, 7.48760986328125, 7.8443603515625, 8.20111083984375, 8.557861328125, 8.91461181640625, 9.2713623046875, 9.62811279296875, 9.98486328125, 10.34161376953125, 10.6983642578125, 11.05511474609375, 11.411865234375, 11.76861572265625, 12.1253662109375, 12.48211669921875, 12.8388671875, 13.19561767578125, 13.5523681640625, 13.90911865234375, 14.265869140625, 14.62261962890625, 14.9793701171875, 15.33612060546875, 15.69287109375, 16.04962158203125, 16.4063720703125, 16.76312255859375, 17.119873046875, 17.47662353515625, 17.8333740234375, 18.19012451171875, 18.546875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 6.0, 2.0, 3.0, 6.0, 9.0, 11.0, 19.0, 35.0, 40.0, 54.0, 105.0, 147.0, 251.0, 506.0, 1052.0, 2829.0, 10970.0, 77022.0, 3434241.0, 624397.0, 33334.0, 5846.0, 1743.0, 756.0, 385.0, 197.0, 133.0, 69.0, 38.0, 26.0, 14.0, 15.0, 1.0, 8.0, 2.0, 3.0, 4.0, 1.0, 0.0, 4.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.546875, -11.2054443359375, -10.864013671875, -10.5225830078125, -10.18115234375, -9.8397216796875, -9.498291015625, -9.1568603515625, -8.8154296875, -8.4739990234375, -8.132568359375, -7.7911376953125, -7.44970703125, -7.1082763671875, -6.766845703125, -6.4254150390625, -6.083984375, -5.7425537109375, -5.401123046875, -5.0596923828125, -4.71826171875, -4.3768310546875, -4.035400390625, -3.6939697265625, -3.3525390625, -3.0111083984375, -2.669677734375, -2.3282470703125, -1.98681640625, -1.6453857421875, -1.303955078125, -0.9625244140625, -0.62109375, -0.2796630859375, 0.061767578125, 0.4031982421875, 0.74462890625, 1.0860595703125, 1.427490234375, 1.7689208984375, 2.1103515625, 2.4517822265625, 2.793212890625, 3.1346435546875, 3.47607421875, 3.8175048828125, 4.158935546875, 4.5003662109375, 4.841796875, 5.1832275390625, 5.524658203125, 5.8660888671875, 6.20751953125, 6.5489501953125, 6.890380859375, 7.2318115234375, 7.5732421875, 7.9146728515625, 8.256103515625, 8.5975341796875, 8.93896484375, 9.2803955078125, 9.621826171875, 9.9632568359375, 10.3046875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 12.0, 7.0, 14.0, 18.0, 31.0, 48.0, 82.0, 155.0, 390.0, 1157.0, 1289.0, 479.0, 170.0, 68.0, 58.0, 30.0, 31.0, 21.0, 6.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.5, -17.040771484375, -16.58154296875, -16.122314453125, -15.6630859375, -15.203857421875, -14.74462890625, -14.285400390625, -13.826171875, -13.366943359375, -12.90771484375, -12.448486328125, -11.9892578125, -11.530029296875, -11.07080078125, -10.611572265625, -10.15234375, -9.693115234375, -9.23388671875, -8.774658203125, -8.3154296875, -7.856201171875, -7.39697265625, -6.937744140625, -6.478515625, -6.019287109375, -5.56005859375, -5.100830078125, -4.6416015625, -4.182373046875, -3.72314453125, -3.263916015625, -2.8046875, -2.345458984375, -1.88623046875, -1.427001953125, -0.9677734375, -0.508544921875, -0.04931640625, 0.409912109375, 0.869140625, 1.328369140625, 1.78759765625, 2.246826171875, 2.7060546875, 3.165283203125, 3.62451171875, 4.083740234375, 4.54296875, 5.002197265625, 5.46142578125, 5.920654296875, 6.3798828125, 6.839111328125, 7.29833984375, 7.757568359375, 8.216796875, 8.676025390625, 9.13525390625, 9.594482421875, 10.0537109375, 10.512939453125, 10.97216796875, 11.431396484375, 11.890625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 10.0, 24.0, 51.0, 152.0, 243.0, 253.0, 154.0, 59.0, 16.0, 12.0, 12.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.57564544677734, -62.462791442871094, -59.349937438964844, -56.237083435058594, -53.124229431152344, -50.011375427246094, -46.89852523803711, -43.78567123413086, -40.67281723022461, -37.55996322631836, -34.44710922241211, -31.334257125854492, -28.221403121948242, -25.108549118041992, -21.995697021484375, -18.882843017578125, -15.769989013671875, -12.657135009765625, -9.544281959533691, -6.431428909301758, -3.318574905395508, -0.2057209014892578, 2.9071311950683594, 6.019985198974609, 9.13283920288086, 12.24569320678711, 15.358546257019043, 18.471399307250977, 21.584253311157227, 24.697107315063477, 27.809959411621094, 30.922813415527344, 34.03565979003906, 37.14851379394531, 40.26136779785156, 43.37422180175781, 46.48707580566406, 49.59992980957031, 52.7127799987793, 55.82563400268555, 58.9384880065918, 62.05134201049805, 65.16419219970703, 68.27704620361328, 71.38990020751953, 74.50275421142578, 77.61560821533203, 80.72846221923828, 83.84131622314453, 86.95417022705078, 90.06702423095703, 93.17987823486328, 96.29273223876953, 99.40558624267578, 102.5184326171875, 105.63128662109375, 108.744140625, 111.85699462890625, 114.9698486328125, 118.08270263671875, 121.195556640625, 124.30841064453125, 127.4212646484375, 130.53411865234375, 133.64697265625]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 7.0, 1.0, 6.0, 8.0, 17.0, 14.0, 31.0, 43.0, 39.0, 58.0, 63.0, 69.0, 90.0, 85.0, 93.0, 71.0, 83.0, 62.0, 44.0, 35.0, 23.0, 25.0, 15.0, 12.0, 9.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-93.15531921386719, -90.95466613769531, -88.75401306152344, -86.5533676147461, -84.35271453857422, -82.15206146240234, -79.95140838623047, -77.7507553100586, -75.55010986328125, -73.34945678710938, -71.1488037109375, -68.94815826416016, -66.74750518798828, -64.5468521118164, -62.34619903564453, -60.145545959472656, -57.94489288330078, -55.744239807128906, -53.5435905456543, -51.34293746948242, -49.14228820800781, -46.94163513183594, -44.74098205566406, -42.54032897949219, -40.33967971801758, -38.1390266418457, -35.938377380371094, -33.73772430419922, -31.537073135375977, -29.336421966552734, -27.13576889038086, -24.935117721557617, -22.734458923339844, -20.5338077545166, -18.33315658569336, -16.132503509521484, -13.931852340698242, -11.731201171875, -9.530549049377441, -7.329896926879883, -5.129245758056641, -2.9285941123962402, -0.7279424667358398, 1.4727091789245605, 3.673360824584961, 5.874011993408203, 8.074664115905762, 10.27531623840332, 12.475967407226562, 14.676618576049805, 16.877269744873047, 19.077922821044922, 21.278573989868164, 23.479225158691406, 25.67987823486328, 27.880529403686523, 30.081180572509766, 32.28183364868164, 34.48248291015625, 36.683135986328125, 38.8837890625, 41.08443832397461, 43.285091400146484, 45.485740661621094, 47.68639373779297]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 2.0, 10.0, 13.0, 11.0, 15.0, 14.0, 37.0, 34.0, 68.0, 129.0, 332.0, 1015.0, 3847.0, 17986.0, 105892.0, 571345.0, 291156.0, 45155.0, 8334.0, 2040.0, 607.0, 212.0, 110.0, 60.0, 37.0, 21.0, 16.0, 8.0, 12.0, 6.0, 9.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.421875, -10.1304931640625, -9.839111328125, -9.5477294921875, -9.25634765625, -8.9649658203125, -8.673583984375, -8.3822021484375, -8.0908203125, -7.7994384765625, -7.508056640625, -7.2166748046875, -6.92529296875, -6.6339111328125, -6.342529296875, -6.0511474609375, -5.759765625, -5.4683837890625, -5.177001953125, -4.8856201171875, -4.59423828125, -4.3028564453125, -4.011474609375, -3.7200927734375, -3.4287109375, -3.1373291015625, -2.845947265625, -2.5545654296875, -2.26318359375, -1.9718017578125, -1.680419921875, -1.3890380859375, -1.09765625, -0.8062744140625, -0.514892578125, -0.2235107421875, 0.06787109375, 0.3592529296875, 0.650634765625, 0.9420166015625, 1.2333984375, 1.5247802734375, 1.816162109375, 2.1075439453125, 2.39892578125, 2.6903076171875, 2.981689453125, 3.2730712890625, 3.564453125, 3.8558349609375, 4.147216796875, 4.4385986328125, 4.72998046875, 5.0213623046875, 5.312744140625, 5.6041259765625, 5.8955078125, 6.1868896484375, 6.478271484375, 6.7696533203125, 7.06103515625, 7.3524169921875, 7.643798828125, 7.9351806640625, 8.2265625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 6.0, 8.0, 7.0, 18.0, 23.0, 30.0, 43.0, 57.0, 77.0, 104.0, 108.0, 101.0, 105.0, 76.0, 89.0, 50.0, 31.0, 37.0, 21.0, 14.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.85546875, -2.66888427734375, -2.4822998046875, -2.29571533203125, -2.109130859375, -1.92254638671875, -1.7359619140625, -1.54937744140625, -1.36279296875, -1.17620849609375, -0.9896240234375, -0.80303955078125, -0.616455078125, -0.42987060546875, -0.2432861328125, -0.05670166015625, 0.1298828125, 0.31646728515625, 0.5030517578125, 0.68963623046875, 0.876220703125, 1.06280517578125, 1.2493896484375, 1.43597412109375, 1.62255859375, 1.80914306640625, 1.9957275390625, 2.18231201171875, 2.368896484375, 2.55548095703125, 2.7420654296875, 2.92864990234375, 3.115234375, 3.30181884765625, 3.4884033203125, 3.67498779296875, 3.861572265625, 4.04815673828125, 4.2347412109375, 4.42132568359375, 4.60791015625, 4.79449462890625, 4.9810791015625, 5.16766357421875, 5.354248046875, 5.54083251953125, 5.7274169921875, 5.91400146484375, 6.1005859375, 6.28717041015625, 6.4737548828125, 6.66033935546875, 6.846923828125, 7.03350830078125, 7.2200927734375, 7.40667724609375, 7.59326171875, 7.77984619140625, 7.9664306640625, 8.15301513671875, 8.339599609375, 8.52618408203125, 8.7127685546875, 8.89935302734375, 9.0859375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 6.0, 12.0, 8.0, 9.0, 6.0, 15.0, 32.0, 24.0, 45.0, 49.0, 76.0, 99.0, 111.0, 177.0, 207.0, 303.0, 419.0, 708.0, 1120.0, 2193.0, 5823.0, 21333.0, 119671.0, 685697.0, 169063.0, 27868.0, 7203.0, 2573.0, 1263.0, 753.0, 491.0, 284.0, 245.0, 148.0, 112.0, 101.0, 75.0, 53.0, 47.0, 25.0, 17.0, 28.0, 23.0, 8.0, 9.0, 7.0, 7.0, 4.0, 1.0, 5.0, 2.0], "bins": [-10.0, -9.7266845703125, -9.453369140625, -9.1800537109375, -8.90673828125, -8.6334228515625, -8.360107421875, -8.0867919921875, -7.8134765625, -7.5401611328125, -7.266845703125, -6.9935302734375, -6.72021484375, -6.4468994140625, -6.173583984375, -5.9002685546875, -5.626953125, -5.3536376953125, -5.080322265625, -4.8070068359375, -4.53369140625, -4.2603759765625, -3.987060546875, -3.7137451171875, -3.4404296875, -3.1671142578125, -2.893798828125, -2.6204833984375, -2.34716796875, -2.0738525390625, -1.800537109375, -1.5272216796875, -1.25390625, -0.9805908203125, -0.707275390625, -0.4339599609375, -0.16064453125, 0.1126708984375, 0.385986328125, 0.6593017578125, 0.9326171875, 1.2059326171875, 1.479248046875, 1.7525634765625, 2.02587890625, 2.2991943359375, 2.572509765625, 2.8458251953125, 3.119140625, 3.3924560546875, 3.665771484375, 3.9390869140625, 4.21240234375, 4.4857177734375, 4.759033203125, 5.0323486328125, 5.3056640625, 5.5789794921875, 5.852294921875, 6.1256103515625, 6.39892578125, 6.6722412109375, 6.945556640625, 7.2188720703125, 7.4921875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 4.0, 4.0, 6.0, 8.0, 20.0, 16.0, 22.0, 17.0, 22.0, 24.0, 28.0, 35.0, 40.0, 36.0, 51.0, 54.0, 48.0, 45.0, 47.0, 58.0, 49.0, 40.0, 48.0, 40.0, 36.0, 27.0, 35.0, 18.0, 19.0, 21.0, 15.0, 9.0, 9.0, 10.0, 10.0, 5.0, 4.0, 4.0, 5.0, 4.0, 1.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.765625, -13.36279296875, -12.9599609375, -12.55712890625, -12.154296875, -11.75146484375, -11.3486328125, -10.94580078125, -10.54296875, -10.14013671875, -9.7373046875, -9.33447265625, -8.931640625, -8.52880859375, -8.1259765625, -7.72314453125, -7.3203125, -6.91748046875, -6.5146484375, -6.11181640625, -5.708984375, -5.30615234375, -4.9033203125, -4.50048828125, -4.09765625, -3.69482421875, -3.2919921875, -2.88916015625, -2.486328125, -2.08349609375, -1.6806640625, -1.27783203125, -0.875, -0.47216796875, -0.0693359375, 0.33349609375, 0.736328125, 1.13916015625, 1.5419921875, 1.94482421875, 2.34765625, 2.75048828125, 3.1533203125, 3.55615234375, 3.958984375, 4.36181640625, 4.7646484375, 5.16748046875, 5.5703125, 5.97314453125, 6.3759765625, 6.77880859375, 7.181640625, 7.58447265625, 7.9873046875, 8.39013671875, 8.79296875, 9.19580078125, 9.5986328125, 10.00146484375, 10.404296875, 10.80712890625, 11.2099609375, 11.61279296875, 12.015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 5.0, 1.0, 2.0, 3.0, 13.0, 14.0, 21.0, 44.0, 63.0, 111.0, 167.0, 371.0, 927.0, 3374.0, 31010.0, 890554.0, 113022.0, 6489.0, 1368.0, 467.0, 215.0, 113.0, 65.0, 37.0, 40.0, 14.0, 8.0, 15.0, 3.0, 8.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7421875, -3.58416748046875, -3.4261474609375, -3.26812744140625, -3.110107421875, -2.95208740234375, -2.7940673828125, -2.63604736328125, -2.47802734375, -2.32000732421875, -2.1619873046875, -2.00396728515625, -1.845947265625, -1.68792724609375, -1.5299072265625, -1.37188720703125, -1.2138671875, -1.05584716796875, -0.8978271484375, -0.73980712890625, -0.581787109375, -0.42376708984375, -0.2657470703125, -0.10772705078125, 0.05029296875, 0.20831298828125, 0.3663330078125, 0.52435302734375, 0.682373046875, 0.84039306640625, 0.9984130859375, 1.15643310546875, 1.314453125, 1.47247314453125, 1.6304931640625, 1.78851318359375, 1.946533203125, 2.10455322265625, 2.2625732421875, 2.42059326171875, 2.57861328125, 2.73663330078125, 2.8946533203125, 3.05267333984375, 3.210693359375, 3.36871337890625, 3.5267333984375, 3.68475341796875, 3.8427734375, 4.00079345703125, 4.1588134765625, 4.31683349609375, 4.474853515625, 4.63287353515625, 4.7908935546875, 4.94891357421875, 5.10693359375, 5.26495361328125, 5.4229736328125, 5.58099365234375, 5.739013671875, 5.89703369140625, 6.0550537109375, 6.21307373046875, 6.37109375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 13.0, 10.0, 18.0, 22.0, 27.0, 36.0, 57.0, 81.0, 84.0, 98.0, 112.0, 98.0, 86.0, 68.0, 50.0, 24.0, 27.0, 14.0, 18.0, 12.0, 10.0, 7.0, 7.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0005092620849609375, -0.000490047037601471, -0.0004708319902420044, -0.00045161694288253784, -0.0004324018955230713, -0.00041318684816360474, -0.0003939718008041382, -0.00037475675344467163, -0.0003555417060852051, -0.0003363266587257385, -0.00031711161136627197, -0.0002978965640068054, -0.00027868151664733887, -0.0002594664692878723, -0.00024025142192840576, -0.0002210363745689392, -0.00020182132720947266, -0.0001826062798500061, -0.00016339123249053955, -0.000144176185131073, -0.00012496113777160645, -0.00010574609041213989, -8.653104305267334e-05, -6.731599569320679e-05, -4.8100948333740234e-05, -2.888590097427368e-05, -9.670853614807129e-06, 9.544193744659424e-06, 2.8759241104125977e-05, 4.797428846359253e-05, 6.718933582305908e-05, 8.640438318252563e-05, 0.00010561943054199219, 0.00012483447790145874, 0.0001440495252609253, 0.00016326457262039185, 0.0001824796199798584, 0.00020169466733932495, 0.0002209097146987915, 0.00024012476205825806, 0.0002593398094177246, 0.00027855485677719116, 0.0002977699041366577, 0.00031698495149612427, 0.0003361999988555908, 0.0003554150462150574, 0.0003746300935745239, 0.0003938451409339905, 0.00041306018829345703, 0.0004322752356529236, 0.00045149028301239014, 0.0004707053303718567, 0.0004899203777313232, 0.0005091354250907898, 0.0005283504724502563, 0.0005475655198097229, 0.0005667805671691895, 0.000585995614528656, 0.0006052106618881226, 0.0006244257092475891, 0.0006436407566070557, 0.0006628558039665222, 0.0006820708513259888, 0.0007012858986854553, 0.0007205009460449219]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 4.0, 5.0, 7.0, 12.0, 14.0, 27.0, 28.0, 37.0, 46.0, 79.0, 141.0, 174.0, 280.0, 524.0, 1063.0, 2732.0, 10255.0, 77009.0, 804350.0, 131385.0, 14227.0, 3321.0, 1299.0, 601.0, 329.0, 192.0, 118.0, 72.0, 55.0, 45.0, 30.0, 23.0, 16.0, 20.0, 10.0, 3.0, 6.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-3.24609375, -3.146514892578125, -3.04693603515625, -2.947357177734375, -2.8477783203125, -2.748199462890625, -2.64862060546875, -2.549041748046875, -2.449462890625, -2.349884033203125, -2.25030517578125, -2.150726318359375, -2.0511474609375, -1.951568603515625, -1.85198974609375, -1.752410888671875, -1.65283203125, -1.553253173828125, -1.45367431640625, -1.354095458984375, -1.2545166015625, -1.154937744140625, -1.05535888671875, -0.955780029296875, -0.856201171875, -0.756622314453125, -0.65704345703125, -0.557464599609375, -0.4578857421875, -0.358306884765625, -0.25872802734375, -0.159149169921875, -0.0595703125, 0.040008544921875, 0.13958740234375, 0.239166259765625, 0.3387451171875, 0.438323974609375, 0.53790283203125, 0.637481689453125, 0.737060546875, 0.836639404296875, 0.93621826171875, 1.035797119140625, 1.1353759765625, 1.234954833984375, 1.33453369140625, 1.434112548828125, 1.53369140625, 1.633270263671875, 1.73284912109375, 1.832427978515625, 1.9320068359375, 2.031585693359375, 2.13116455078125, 2.230743408203125, 2.330322265625, 2.429901123046875, 2.52947998046875, 2.629058837890625, 2.7286376953125, 2.828216552734375, 2.92779541015625, 3.027374267578125, 3.126953125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 4.0, 8.0, 11.0, 2.0, 10.0, 19.0, 24.0, 29.0, 38.0, 34.0, 57.0, 68.0, 78.0, 106.0, 90.0, 81.0, 79.0, 66.0, 40.0, 39.0, 26.0, 20.0, 17.0, 17.0, 7.0, 5.0, 7.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.8046875, -3.70733642578125, -3.6099853515625, -3.51263427734375, -3.415283203125, -3.31793212890625, -3.2205810546875, -3.12322998046875, -3.02587890625, -2.92852783203125, -2.8311767578125, -2.73382568359375, -2.636474609375, -2.53912353515625, -2.4417724609375, -2.34442138671875, -2.2470703125, -2.14971923828125, -2.0523681640625, -1.95501708984375, -1.857666015625, -1.76031494140625, -1.6629638671875, -1.56561279296875, -1.46826171875, -1.37091064453125, -1.2735595703125, -1.17620849609375, -1.078857421875, -0.98150634765625, -0.8841552734375, -0.78680419921875, -0.689453125, -0.59210205078125, -0.4947509765625, -0.39739990234375, -0.300048828125, -0.20269775390625, -0.1053466796875, -0.00799560546875, 0.08935546875, 0.18670654296875, 0.2840576171875, 0.38140869140625, 0.478759765625, 0.57611083984375, 0.6734619140625, 0.77081298828125, 0.8681640625, 0.96551513671875, 1.0628662109375, 1.16021728515625, 1.257568359375, 1.35491943359375, 1.4522705078125, 1.54962158203125, 1.64697265625, 1.74432373046875, 1.8416748046875, 1.93902587890625, 2.036376953125, 2.13372802734375, 2.2310791015625, 2.32843017578125, 2.42578125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 1.0, 1.0, 5.0, 9.0, 14.0, 49.0, 98.0, 167.0, 304.0, 184.0, 93.0, 34.0, 17.0, 9.0, 6.0, 5.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.66461181640625, -115.9339599609375, -113.20330047607422, -110.47264862060547, -107.74198913574219, -105.01133728027344, -102.28068542480469, -99.5500259399414, -96.81937408447266, -94.0887222290039, -91.35806274414062, -88.62741088867188, -85.8967514038086, -83.16609954833984, -80.43544006347656, -77.70478820800781, -74.97413635253906, -72.24348449707031, -69.51282501220703, -66.78217315673828, -64.051513671875, -61.32086181640625, -58.590206146240234, -55.85955047607422, -53.12889099121094, -50.39823532104492, -47.667579650878906, -44.936927795410156, -42.20627212524414, -39.475616455078125, -36.74496078491211, -34.014305114746094, -31.283653259277344, -28.552997589111328, -25.822343826293945, -23.09168815612793, -20.361034393310547, -17.63037872314453, -14.899723052978516, -12.169069290161133, -9.438413619995117, -6.707758903503418, -3.9771037101745605, -1.2464485168457031, 1.484206199645996, 4.214860916137695, 6.945516586303711, 9.676170349121094, 12.40682601928711, 15.137480735778809, 17.868135452270508, 20.598791122436523, 23.329444885253906, 26.060100555419922, 28.790756225585938, 31.52140998840332, 34.25206756591797, 36.982723236083984, 39.71337890625, 42.44403076171875, 45.174686431884766, 47.90534210205078, 50.6359977722168, 53.36665344238281, 56.09730529785156]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 6.0, 3.0, 6.0, 1.0, 5.0, 6.0, 3.0, 9.0, 20.0, 14.0, 19.0, 23.0, 22.0, 24.0, 40.0, 40.0, 36.0, 40.0, 55.0, 59.0, 84.0, 74.0, 57.0, 47.0, 38.0, 36.0, 42.0, 33.0, 26.0, 22.0, 21.0, 24.0, 12.0, 17.0, 14.0, 6.0, 7.0, 4.0, 5.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-50.79148483276367, -49.08391571044922, -47.376346588134766, -45.66877746582031, -43.961212158203125, -42.25364303588867, -40.54607391357422, -38.838504791259766, -37.13093566894531, -35.42336654663086, -33.715797424316406, -32.00823211669922, -30.300662994384766, -28.593093872070312, -26.88552474975586, -25.177955627441406, -23.47039031982422, -21.762821197509766, -20.055253982543945, -18.347684860229492, -16.640117645263672, -14.932548522949219, -13.224979400634766, -11.517411231994629, -9.809843063354492, -8.102274894714355, -6.3947062492370605, -4.687137603759766, -2.979569435119629, -1.2720012664794922, 0.43556785583496094, 2.1431360244750977, 3.8507080078125, 5.558276176452637, 7.265844821929932, 8.973413467407227, 10.680981636047363, 12.3885498046875, 14.096118927001953, 15.80368709564209, 17.511255264282227, 19.21882438659668, 20.9263916015625, 22.633960723876953, 24.341529846191406, 26.049097061157227, 27.75666618347168, 29.4642333984375, 31.171802520751953, 32.879371643066406, 34.58694076538086, 36.29450988769531, 38.0020751953125, 39.70964431762695, 41.417213439941406, 43.12478256225586, 44.83235168457031, 46.539920806884766, 48.24748992919922, 49.955055236816406, 51.66262435913086, 53.37019348144531, 55.077762603759766, 56.78533172607422, 58.492897033691406]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [5.0, 2.0, 3.0, 10.0, 14.0, 25.0, 56.0, 109.0, 190.0, 427.0, 1085.0, 3080.0, 10783.0, 62261.0, 986103.0, 2907958.0, 193960.0, 20187.0, 5070.0, 1621.0, 701.0, 288.0, 172.0, 73.0, 39.0, 35.0, 12.0, 7.0, 6.0, 4.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.513671875, -2.348663330078125, -2.18365478515625, -2.018646240234375, -1.8536376953125, -1.688629150390625, -1.52362060546875, -1.358612060546875, -1.193603515625, -1.028594970703125, -0.86358642578125, -0.698577880859375, -0.5335693359375, -0.368560791015625, -0.20355224609375, -0.038543701171875, 0.12646484375, 0.291473388671875, 0.45648193359375, 0.621490478515625, 0.7864990234375, 0.951507568359375, 1.11651611328125, 1.281524658203125, 1.446533203125, 1.611541748046875, 1.77655029296875, 1.941558837890625, 2.1065673828125, 2.271575927734375, 2.43658447265625, 2.601593017578125, 2.7666015625, 2.931610107421875, 3.09661865234375, 3.261627197265625, 3.4266357421875, 3.591644287109375, 3.75665283203125, 3.921661376953125, 4.086669921875, 4.251678466796875, 4.41668701171875, 4.581695556640625, 4.7467041015625, 4.911712646484375, 5.07672119140625, 5.241729736328125, 5.40673828125, 5.571746826171875, 5.73675537109375, 5.901763916015625, 6.0667724609375, 6.231781005859375, 6.39678955078125, 6.561798095703125, 6.726806640625, 6.891815185546875, 7.05682373046875, 7.221832275390625, 7.3868408203125, 7.551849365234375, 7.71685791015625, 7.881866455078125, 8.046875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 3.0, 4.0, 3.0, 5.0, 10.0, 12.0, 15.0, 10.0, 14.0, 23.0, 18.0, 21.0, 37.0, 31.0, 23.0, 31.0, 45.0, 40.0, 45.0, 49.0, 47.0, 33.0, 43.0, 38.0, 41.0, 40.0, 39.0, 23.0, 36.0, 28.0, 24.0, 32.0, 19.0, 20.0, 18.0, 17.0, 10.0, 12.0, 10.0, 7.0, 6.0, 6.0, 7.0, 2.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.423828125, -2.345306396484375, -2.26678466796875, -2.188262939453125, -2.1097412109375, -2.031219482421875, -1.95269775390625, -1.874176025390625, -1.795654296875, -1.717132568359375, -1.63861083984375, -1.560089111328125, -1.4815673828125, -1.403045654296875, -1.32452392578125, -1.246002197265625, -1.16748046875, -1.088958740234375, -1.01043701171875, -0.931915283203125, -0.8533935546875, -0.774871826171875, -0.69635009765625, -0.617828369140625, -0.539306640625, -0.460784912109375, -0.38226318359375, -0.303741455078125, -0.2252197265625, -0.146697998046875, -0.06817626953125, 0.010345458984375, 0.0888671875, 0.167388916015625, 0.24591064453125, 0.324432373046875, 0.4029541015625, 0.481475830078125, 0.55999755859375, 0.638519287109375, 0.717041015625, 0.795562744140625, 0.87408447265625, 0.952606201171875, 1.0311279296875, 1.109649658203125, 1.18817138671875, 1.266693115234375, 1.34521484375, 1.423736572265625, 1.50225830078125, 1.580780029296875, 1.6593017578125, 1.737823486328125, 1.81634521484375, 1.894866943359375, 1.973388671875, 2.051910400390625, 2.13043212890625, 2.208953857421875, 2.2874755859375, 2.365997314453125, 2.44451904296875, 2.523040771484375, 2.6015625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 14.0, 12.0, 16.0, 34.0, 43.0, 88.0, 111.0, 216.0, 348.0, 883.0, 2337.0, 8297.0, 45580.0, 997602.0, 3051809.0, 72118.0, 10532.0, 2531.0, 915.0, 376.0, 169.0, 103.0, 50.0, 38.0, 22.0, 17.0, 6.0, 3.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.875, -9.60162353515625, -9.3282470703125, -9.05487060546875, -8.781494140625, -8.50811767578125, -8.2347412109375, -7.96136474609375, -7.68798828125, -7.41461181640625, -7.1412353515625, -6.86785888671875, -6.594482421875, -6.32110595703125, -6.0477294921875, -5.77435302734375, -5.5009765625, -5.22760009765625, -4.9542236328125, -4.68084716796875, -4.407470703125, -4.13409423828125, -3.8607177734375, -3.58734130859375, -3.31396484375, -3.04058837890625, -2.7672119140625, -2.49383544921875, -2.220458984375, -1.94708251953125, -1.6737060546875, -1.40032958984375, -1.126953125, -0.85357666015625, -0.5802001953125, -0.30682373046875, -0.033447265625, 0.23992919921875, 0.5133056640625, 0.78668212890625, 1.06005859375, 1.33343505859375, 1.6068115234375, 1.88018798828125, 2.153564453125, 2.42694091796875, 2.7003173828125, 2.97369384765625, 3.2470703125, 3.52044677734375, 3.7938232421875, 4.06719970703125, 4.340576171875, 4.61395263671875, 4.8873291015625, 5.16070556640625, 5.43408203125, 5.70745849609375, 5.9808349609375, 6.25421142578125, 6.527587890625, 6.80096435546875, 7.0743408203125, 7.34771728515625, 7.62109375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 6.0, 6.0, 14.0, 18.0, 20.0, 24.0, 40.0, 48.0, 81.0, 157.0, 361.0, 803.0, 1191.0, 684.0, 260.0, 165.0, 67.0, 32.0, 30.0, 29.0, 20.0, 7.0, 3.0, 6.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.71875, -12.40399169921875, -12.0892333984375, -11.77447509765625, -11.459716796875, -11.14495849609375, -10.8302001953125, -10.51544189453125, -10.20068359375, -9.88592529296875, -9.5711669921875, -9.25640869140625, -8.941650390625, -8.62689208984375, -8.3121337890625, -7.99737548828125, -7.6826171875, -7.36785888671875, -7.0531005859375, -6.73834228515625, -6.423583984375, -6.10882568359375, -5.7940673828125, -5.47930908203125, -5.16455078125, -4.84979248046875, -4.5350341796875, -4.22027587890625, -3.905517578125, -3.59075927734375, -3.2760009765625, -2.96124267578125, -2.646484375, -2.33172607421875, -2.0169677734375, -1.70220947265625, -1.387451171875, -1.07269287109375, -0.7579345703125, -0.44317626953125, -0.12841796875, 0.18634033203125, 0.5010986328125, 0.81585693359375, 1.130615234375, 1.44537353515625, 1.7601318359375, 2.07489013671875, 2.3896484375, 2.70440673828125, 3.0191650390625, 3.33392333984375, 3.648681640625, 3.96343994140625, 4.2781982421875, 4.59295654296875, 4.90771484375, 5.22247314453125, 5.5372314453125, 5.85198974609375, 6.166748046875, 6.48150634765625, 6.7962646484375, 7.11102294921875, 7.42578125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 11.0, 24.0, 60.0, 162.0, 245.0, 241.0, 148.0, 49.0, 17.0, 11.0, 8.0, 8.0, 4.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-111.8614501953125, -109.19195556640625, -106.52245330810547, -103.85295867919922, -101.18345642089844, -98.51396179199219, -95.8444595336914, -93.17496490478516, -90.50546264648438, -87.83596801757812, -85.16646575927734, -82.4969711303711, -79.82746887207031, -77.15797424316406, -74.48847198486328, -71.81897735595703, -69.14947509765625, -66.47998046875, -63.81047821044922, -61.1409797668457, -58.47148132324219, -55.80198287963867, -53.132484436035156, -50.462989807128906, -47.793495178222656, -45.12399673461914, -42.454498291015625, -39.78499984741211, -37.115501403808594, -34.44600296020508, -31.776506423950195, -29.10700798034668, -26.43750762939453, -23.768009185791016, -21.0985107421875, -18.429012298583984, -15.759514808654785, -13.09001636505127, -10.42051887512207, -7.751020431518555, -5.081521987915039, -2.4120237827301025, 0.257474422454834, 2.9269723892211914, 5.596470832824707, 8.265969276428223, 10.935466766357422, 13.604965209960938, 16.274463653564453, 18.94396209716797, 21.613460540771484, 24.282958984375, 26.952457427978516, 29.62195587158203, 32.29145050048828, 34.96095275878906, 37.63044738769531, 40.29994583129883, 42.969444274902344, 45.63894271850586, 48.308441162109375, 50.97793960571289, 53.647438049316406, 56.316932678222656, 58.98643493652344]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 3.0, 7.0, 7.0, 13.0, 13.0, 11.0, 14.0, 22.0, 17.0, 31.0, 19.0, 28.0, 25.0, 34.0, 41.0, 44.0, 38.0, 39.0, 47.0, 55.0, 52.0, 54.0, 45.0, 54.0, 26.0, 29.0, 29.0, 23.0, 36.0, 21.0, 16.0, 20.0, 24.0, 11.0, 12.0, 9.0, 8.0, 8.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-36.39805603027344, -35.395591735839844, -34.39312744140625, -33.390663146972656, -32.3881950378418, -31.385730743408203, -30.38326644897461, -29.380802154541016, -28.378337860107422, -27.375873565673828, -26.3734073638916, -25.370943069458008, -24.368478775024414, -23.366012573242188, -22.363548278808594, -21.361083984375, -20.358617782592773, -19.35615348815918, -18.353687286376953, -17.35122299194336, -16.348758697509766, -15.346293449401855, -14.343828201293945, -13.341363906860352, -12.338898658752441, -11.336433410644531, -10.333969116210938, -9.331503868103027, -8.329038619995117, -7.326574325561523, -6.324109077453613, -5.321644306182861, -4.319177627563477, -3.3167128562927246, -2.3142478466033936, -1.3117828369140625, -0.30931806564331055, 0.6931467056274414, 1.6956119537353516, 2.6980767250061035, 3.7005414962768555, 4.703006267547607, 5.705471038818359, 6.7079362869262695, 7.7104010581970215, 8.712865829467773, 9.715331077575684, 10.717796325683594, 11.720260620117188, 12.722725868225098, 13.725190162658691, 14.727655410766602, 15.730119705200195, 16.732585906982422, 17.735050201416016, 18.73751449584961, 19.739978790283203, 20.742443084716797, 21.744909286499023, 22.747373580932617, 23.74983787536621, 24.752304077148438, 25.75476837158203, 26.757232666015625, 27.75969886779785]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 8.0, 4.0, 15.0, 13.0, 31.0, 39.0, 81.0, 146.0, 257.0, 497.0, 955.0, 1871.0, 3765.0, 8490.0, 20975.0, 54996.0, 149028.0, 379421.0, 269269.0, 96668.0, 36140.0, 14247.0, 6008.0, 2770.0, 1331.0, 673.0, 400.0, 209.0, 90.0, 68.0, 40.0, 19.0, 8.0, 7.0, 9.0, 7.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.66796875, -5.50958251953125, -5.3511962890625, -5.19281005859375, -5.034423828125, -4.87603759765625, -4.7176513671875, -4.55926513671875, -4.40087890625, -4.24249267578125, -4.0841064453125, -3.92572021484375, -3.767333984375, -3.60894775390625, -3.4505615234375, -3.29217529296875, -3.1337890625, -2.97540283203125, -2.8170166015625, -2.65863037109375, -2.500244140625, -2.34185791015625, -2.1834716796875, -2.02508544921875, -1.86669921875, -1.70831298828125, -1.5499267578125, -1.39154052734375, -1.233154296875, -1.07476806640625, -0.9163818359375, -0.75799560546875, -0.599609375, -0.44122314453125, -0.2828369140625, -0.12445068359375, 0.033935546875, 0.19232177734375, 0.3507080078125, 0.50909423828125, 0.66748046875, 0.82586669921875, 0.9842529296875, 1.14263916015625, 1.301025390625, 1.45941162109375, 1.6177978515625, 1.77618408203125, 1.9345703125, 2.09295654296875, 2.2513427734375, 2.40972900390625, 2.568115234375, 2.72650146484375, 2.8848876953125, 3.04327392578125, 3.20166015625, 3.36004638671875, 3.5184326171875, 3.67681884765625, 3.835205078125, 3.99359130859375, 4.1519775390625, 4.31036376953125, 4.46875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 2.0, 4.0, 3.0, 5.0, 6.0, 3.0, 12.0, 10.0, 18.0, 8.0, 16.0, 10.0, 14.0, 17.0, 26.0, 15.0, 30.0, 36.0, 33.0, 32.0, 24.0, 39.0, 36.0, 42.0, 46.0, 36.0, 32.0, 30.0, 53.0, 34.0, 29.0, 40.0, 26.0, 30.0, 23.0, 17.0, 18.0, 16.0, 24.0, 17.0, 20.0, 11.0, 12.0, 13.0, 10.0, 8.0, 7.0, 2.0, 2.0, 4.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.130859375, -2.05908203125, -1.9873046875, -1.91552734375, -1.84375, -1.77197265625, -1.7001953125, -1.62841796875, -1.556640625, -1.48486328125, -1.4130859375, -1.34130859375, -1.26953125, -1.19775390625, -1.1259765625, -1.05419921875, -0.982421875, -0.91064453125, -0.8388671875, -0.76708984375, -0.6953125, -0.62353515625, -0.5517578125, -0.47998046875, -0.408203125, -0.33642578125, -0.2646484375, -0.19287109375, -0.12109375, -0.04931640625, 0.0224609375, 0.09423828125, 0.166015625, 0.23779296875, 0.3095703125, 0.38134765625, 0.453125, 0.52490234375, 0.5966796875, 0.66845703125, 0.740234375, 0.81201171875, 0.8837890625, 0.95556640625, 1.02734375, 1.09912109375, 1.1708984375, 1.24267578125, 1.314453125, 1.38623046875, 1.4580078125, 1.52978515625, 1.6015625, 1.67333984375, 1.7451171875, 1.81689453125, 1.888671875, 1.96044921875, 2.0322265625, 2.10400390625, 2.17578125, 2.24755859375, 2.3193359375, 2.39111328125, 2.462890625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 6.0, 14.0, 8.0, 17.0, 37.0, 32.0, 51.0, 83.0, 111.0, 180.0, 262.0, 444.0, 712.0, 1490.0, 3759.0, 15697.0, 141574.0, 781702.0, 85361.0, 11111.0, 2928.0, 1198.0, 665.0, 384.0, 231.0, 122.0, 122.0, 75.0, 52.0, 38.0, 30.0, 13.0, 10.0, 8.0, 7.0, 8.0, 2.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.6171875, -8.2489013671875, -7.880615234375, -7.5123291015625, -7.14404296875, -6.7757568359375, -6.407470703125, -6.0391845703125, -5.6708984375, -5.3026123046875, -4.934326171875, -4.5660400390625, -4.19775390625, -3.8294677734375, -3.461181640625, -3.0928955078125, -2.724609375, -2.3563232421875, -1.988037109375, -1.6197509765625, -1.25146484375, -0.8831787109375, -0.514892578125, -0.1466064453125, 0.2216796875, 0.5899658203125, 0.958251953125, 1.3265380859375, 1.69482421875, 2.0631103515625, 2.431396484375, 2.7996826171875, 3.16796875, 3.5362548828125, 3.904541015625, 4.2728271484375, 4.64111328125, 5.0093994140625, 5.377685546875, 5.7459716796875, 6.1142578125, 6.4825439453125, 6.850830078125, 7.2191162109375, 7.58740234375, 7.9556884765625, 8.323974609375, 8.6922607421875, 9.060546875, 9.4288330078125, 9.797119140625, 10.1654052734375, 10.53369140625, 10.9019775390625, 11.270263671875, 11.6385498046875, 12.0068359375, 12.3751220703125, 12.743408203125, 13.1116943359375, 13.47998046875, 13.8482666015625, 14.216552734375, 14.5848388671875, 14.953125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 4.0, 5.0, 5.0, 8.0, 17.0, 23.0, 26.0, 19.0, 29.0, 31.0, 37.0, 56.0, 55.0, 41.0, 59.0, 57.0, 58.0, 61.0, 65.0, 58.0, 40.0, 38.0, 30.0, 39.0, 45.0, 19.0, 19.0, 18.0, 7.0, 7.0, 5.0, 8.0, 4.0, 3.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6953125, -11.2545166015625, -10.813720703125, -10.3729248046875, -9.93212890625, -9.4913330078125, -9.050537109375, -8.6097412109375, -8.1689453125, -7.7281494140625, -7.287353515625, -6.8465576171875, -6.40576171875, -5.9649658203125, -5.524169921875, -5.0833740234375, -4.642578125, -4.2017822265625, -3.760986328125, -3.3201904296875, -2.87939453125, -2.4385986328125, -1.997802734375, -1.5570068359375, -1.1162109375, -0.6754150390625, -0.234619140625, 0.2061767578125, 0.64697265625, 1.0877685546875, 1.528564453125, 1.9693603515625, 2.41015625, 2.8509521484375, 3.291748046875, 3.7325439453125, 4.17333984375, 4.6141357421875, 5.054931640625, 5.4957275390625, 5.9365234375, 6.3773193359375, 6.818115234375, 7.2589111328125, 7.69970703125, 8.1405029296875, 8.581298828125, 9.0220947265625, 9.462890625, 9.9036865234375, 10.344482421875, 10.7852783203125, 11.22607421875, 11.6668701171875, 12.107666015625, 12.5484619140625, 12.9892578125, 13.4300537109375, 13.870849609375, 14.3116455078125, 14.75244140625, 15.1932373046875, 15.634033203125, 16.0748291015625, 16.515625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 7.0, 5.0, 9.0, 17.0, 31.0, 54.0, 152.0, 463.0, 2031.0, 34124.0, 984119.0, 25005.0, 1866.0, 404.0, 143.0, 54.0, 29.0, 19.0, 8.0, 7.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.18359375, -6.93121337890625, -6.6788330078125, -6.42645263671875, -6.174072265625, -5.92169189453125, -5.6693115234375, -5.41693115234375, -5.16455078125, -4.91217041015625, -4.6597900390625, -4.40740966796875, -4.155029296875, -3.90264892578125, -3.6502685546875, -3.39788818359375, -3.1455078125, -2.89312744140625, -2.6407470703125, -2.38836669921875, -2.135986328125, -1.88360595703125, -1.6312255859375, -1.37884521484375, -1.12646484375, -0.87408447265625, -0.6217041015625, -0.36932373046875, -0.116943359375, 0.13543701171875, 0.3878173828125, 0.64019775390625, 0.892578125, 1.14495849609375, 1.3973388671875, 1.64971923828125, 1.902099609375, 2.15447998046875, 2.4068603515625, 2.65924072265625, 2.91162109375, 3.16400146484375, 3.4163818359375, 3.66876220703125, 3.921142578125, 4.17352294921875, 4.4259033203125, 4.67828369140625, 4.9306640625, 5.18304443359375, 5.4354248046875, 5.68780517578125, 5.940185546875, 6.19256591796875, 6.4449462890625, 6.69732666015625, 6.94970703125, 7.20208740234375, 7.4544677734375, 7.70684814453125, 7.959228515625, 8.21160888671875, 8.4639892578125, 8.71636962890625, 8.96875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 8.0, 16.0, 25.0, 30.0, 82.0, 95.0, 173.0, 180.0, 154.0, 108.0, 48.0, 33.0, 20.0, 14.0, 4.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015325546264648438, -0.0014926940202713013, -0.0014528334140777588, -0.0014129728078842163, -0.0013731122016906738, -0.0013332515954971313, -0.0012933909893035889, -0.0012535303831100464, -0.001213669776916504, -0.0011738091707229614, -0.001133948564529419, -0.0010940879583358765, -0.001054227352142334, -0.0010143667459487915, -0.000974506139755249, -0.0009346455335617065, -0.0008947849273681641, -0.0008549243211746216, -0.0008150637149810791, -0.0007752031087875366, -0.0007353425025939941, -0.0006954818964004517, -0.0006556212902069092, -0.0006157606840133667, -0.0005759000778198242, -0.0005360394716262817, -0.0004961788654327393, -0.0004563182592391968, -0.0004164576530456543, -0.0003765970468521118, -0.00033673644065856934, -0.00029687583446502686, -0.0002570152282714844, -0.0002171546220779419, -0.00017729401588439941, -0.00013743340969085693, -9.757280349731445e-05, -5.771219730377197e-05, -1.7851591110229492e-05, 2.2009015083312988e-05, 6.186962127685547e-05, 0.00010173022747039795, 0.00014159083366394043, 0.0001814514398574829, 0.0002213120460510254, 0.00026117265224456787, 0.00030103325843811035, 0.00034089386463165283, 0.0003807544708251953, 0.0004206150770187378, 0.0004604756832122803, 0.0005003362894058228, 0.0005401968955993652, 0.0005800575017929077, 0.0006199181079864502, 0.0006597787141799927, 0.0006996393203735352, 0.0007394999265670776, 0.0007793605327606201, 0.0008192211389541626, 0.0008590817451477051, 0.0008989423513412476, 0.00093880295753479, 0.0009786635637283325, 0.001018524169921875]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 3.0, 6.0, 8.0, 13.0, 16.0, 24.0, 35.0, 57.0, 90.0, 121.0, 198.0, 290.0, 596.0, 1142.0, 2850.0, 9763.0, 72200.0, 787384.0, 150993.0, 15861.0, 3842.0, 1414.0, 677.0, 394.0, 223.0, 116.0, 97.0, 33.0, 30.0, 16.0, 18.0, 14.0, 12.0, 6.0, 4.0, 6.0, 0.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6015625, -2.50390625, -2.40625, -2.30859375, -2.2109375, -2.11328125, -2.015625, -1.91796875, -1.8203125, -1.72265625, -1.625, -1.52734375, -1.4296875, -1.33203125, -1.234375, -1.13671875, -1.0390625, -0.94140625, -0.84375, -0.74609375, -0.6484375, -0.55078125, -0.453125, -0.35546875, -0.2578125, -0.16015625, -0.0625, 0.03515625, 0.1328125, 0.23046875, 0.328125, 0.42578125, 0.5234375, 0.62109375, 0.71875, 0.81640625, 0.9140625, 1.01171875, 1.109375, 1.20703125, 1.3046875, 1.40234375, 1.5, 1.59765625, 1.6953125, 1.79296875, 1.890625, 1.98828125, 2.0859375, 2.18359375, 2.28125, 2.37890625, 2.4765625, 2.57421875, 2.671875, 2.76953125, 2.8671875, 2.96484375, 3.0625, 3.16015625, 3.2578125, 3.35546875, 3.453125, 3.55078125, 3.6484375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 6.0, 8.0, 5.0, 10.0, 10.0, 15.0, 10.0, 26.0, 31.0, 32.0, 37.0, 57.0, 59.0, 69.0, 77.0, 84.0, 88.0, 66.0, 68.0, 50.0, 51.0, 30.0, 27.0, 18.0, 12.0, 8.0, 11.0, 8.0, 9.0, 2.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.828125, -1.7501220703125, -1.672119140625, -1.5941162109375, -1.51611328125, -1.4381103515625, -1.360107421875, -1.2821044921875, -1.2041015625, -1.1260986328125, -1.048095703125, -0.9700927734375, -0.89208984375, -0.8140869140625, -0.736083984375, -0.6580810546875, -0.580078125, -0.5020751953125, -0.424072265625, -0.3460693359375, -0.26806640625, -0.1900634765625, -0.112060546875, -0.0340576171875, 0.0439453125, 0.1219482421875, 0.199951171875, 0.2779541015625, 0.35595703125, 0.4339599609375, 0.511962890625, 0.5899658203125, 0.66796875, 0.7459716796875, 0.823974609375, 0.9019775390625, 0.97998046875, 1.0579833984375, 1.135986328125, 1.2139892578125, 1.2919921875, 1.3699951171875, 1.447998046875, 1.5260009765625, 1.60400390625, 1.6820068359375, 1.760009765625, 1.8380126953125, 1.916015625, 1.9940185546875, 2.072021484375, 2.1500244140625, 2.22802734375, 2.3060302734375, 2.384033203125, 2.4620361328125, 2.5400390625, 2.6180419921875, 2.696044921875, 2.7740478515625, 2.85205078125, 2.9300537109375, 3.008056640625, 3.0860595703125, 3.1640625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 7.0, 21.0, 36.0, 73.0, 167.0, 346.0, 195.0, 77.0, 47.0, 19.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-116.12663269042969, -113.33516693115234, -110.543701171875, -107.75224304199219, -104.96077728271484, -102.1693115234375, -99.37785339355469, -96.58638763427734, -93.794921875, -91.00345611572266, -88.21199035644531, -85.4205322265625, -82.62906646728516, -79.83760070800781, -77.046142578125, -74.25467681884766, -71.46321105957031, -68.67174530029297, -65.88027954101562, -63.08882141113281, -60.29735565185547, -57.505889892578125, -54.71442794799805, -51.92296600341797, -49.131500244140625, -46.34003448486328, -43.5485725402832, -40.757110595703125, -37.96564483642578, -35.17417907714844, -32.38271713256836, -29.59125328063965, -26.79979705810547, -24.008333206176758, -21.216869354248047, -18.425405502319336, -15.633941650390625, -12.842477798461914, -10.051013946533203, -7.259550094604492, -4.468086242675781, -1.6766223907470703, 1.1148414611816406, 3.9063053131103516, 6.6977691650390625, 9.489233016967773, 12.280696868896484, 15.072160720825195, 17.863624572753906, 20.655088424682617, 23.446552276611328, 26.23801612854004, 29.02947998046875, 31.82094383239746, 34.61240768432617, 37.40386962890625, 40.195335388183594, 42.98680114746094, 45.778263092041016, 48.569725036621094, 51.36119079589844, 54.15265655517578, 56.94411849975586, 59.73558044433594, 62.52704620361328]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 7.0, 7.0, 7.0, 12.0, 9.0, 20.0, 22.0, 22.0, 28.0, 28.0, 21.0, 32.0, 38.0, 43.0, 44.0, 65.0, 68.0, 79.0, 67.0, 55.0, 36.0, 41.0, 31.0, 29.0, 23.0, 28.0, 23.0, 17.0, 25.0, 13.0, 9.0, 10.0, 9.0, 8.0, 5.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.67866516113281, -41.17388916015625, -39.66911315917969, -38.16434097290039, -36.65956497192383, -35.154788970947266, -33.65001678466797, -32.145240783691406, -30.640464782714844, -29.13568878173828, -27.63091468811035, -26.126140594482422, -24.62136459350586, -23.116588592529297, -21.611814498901367, -20.107040405273438, -18.602264404296875, -17.097488403320312, -15.592714309692383, -14.087939262390137, -12.58316421508789, -11.078389167785645, -9.573614120483398, -8.068839073181152, -6.564064025878906, -5.05928897857666, -3.554513931274414, -2.049738883972168, -0.5449638366699219, 0.9598112106323242, 2.4645862579345703, 3.9693613052368164, 5.4741363525390625, 6.978911399841309, 8.483686447143555, 9.9884614944458, 11.493236541748047, 12.998011589050293, 14.502786636352539, 16.00756072998047, 17.51233673095703, 19.017112731933594, 20.521886825561523, 22.026660919189453, 23.531436920166016, 25.036212921142578, 26.540987014770508, 28.045761108398438, 29.550537109375, 31.055313110351562, 32.560089111328125, 34.06486129760742, 35.569637298583984, 37.07441329956055, 38.579185485839844, 40.083961486816406, 41.58873748779297, 43.09351348876953, 44.598289489746094, 46.10306167602539, 47.60783767700195, 49.112613677978516, 50.61738586425781, 52.122161865234375, 53.62693786621094]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 8.0, 8.0, 12.0, 6.0, 16.0, 24.0, 39.0, 64.0, 86.0, 131.0, 224.0, 328.0, 572.0, 1054.0, 2053.0, 4408.0, 11858.0, 43320.0, 213005.0, 1126089.0, 2154821.0, 514624.0, 89352.0, 19323.0, 6499.0, 2916.0, 1402.0, 766.0, 441.0, 290.0, 172.0, 127.0, 75.0, 55.0, 33.0, 21.0, 20.0, 14.0, 9.0, 6.0, 3.0, 7.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.57421875, -2.486236572265625, -2.39825439453125, -2.310272216796875, -2.2222900390625, -2.134307861328125, -2.04632568359375, -1.958343505859375, -1.870361328125, -1.782379150390625, -1.69439697265625, -1.606414794921875, -1.5184326171875, -1.430450439453125, -1.34246826171875, -1.254486083984375, -1.16650390625, -1.078521728515625, -0.99053955078125, -0.902557373046875, -0.8145751953125, -0.726593017578125, -0.63861083984375, -0.550628662109375, -0.462646484375, -0.374664306640625, -0.28668212890625, -0.198699951171875, -0.1107177734375, -0.022735595703125, 0.06524658203125, 0.153228759765625, 0.2412109375, 0.329193115234375, 0.41717529296875, 0.505157470703125, 0.5931396484375, 0.681121826171875, 0.76910400390625, 0.857086181640625, 0.945068359375, 1.033050537109375, 1.12103271484375, 1.209014892578125, 1.2969970703125, 1.384979248046875, 1.47296142578125, 1.560943603515625, 1.64892578125, 1.736907958984375, 1.82489013671875, 1.912872314453125, 2.0008544921875, 2.088836669921875, 2.17681884765625, 2.264801025390625, 2.352783203125, 2.440765380859375, 2.52874755859375, 2.616729736328125, 2.7047119140625, 2.792694091796875, 2.88067626953125, 2.968658447265625, 3.056640625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 10.0, 10.0, 15.0, 10.0, 10.0, 17.0, 14.0, 24.0, 23.0, 20.0, 32.0, 34.0, 24.0, 39.0, 40.0, 54.0, 30.0, 45.0, 42.0, 32.0, 37.0, 41.0, 37.0, 49.0, 23.0, 34.0, 32.0, 21.0, 20.0, 14.0, 17.0, 24.0, 18.0, 12.0, 11.0, 16.0, 10.0, 10.0, 10.0, 7.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1484375, -2.077423095703125, -2.00640869140625, -1.935394287109375, -1.8643798828125, -1.793365478515625, -1.72235107421875, -1.651336669921875, -1.580322265625, -1.509307861328125, -1.43829345703125, -1.367279052734375, -1.2962646484375, -1.225250244140625, -1.15423583984375, -1.083221435546875, -1.01220703125, -0.941192626953125, -0.87017822265625, -0.799163818359375, -0.7281494140625, -0.657135009765625, -0.58612060546875, -0.515106201171875, -0.444091796875, -0.373077392578125, -0.30206298828125, -0.231048583984375, -0.1600341796875, -0.089019775390625, -0.01800537109375, 0.053009033203125, 0.1240234375, 0.195037841796875, 0.26605224609375, 0.337066650390625, 0.4080810546875, 0.479095458984375, 0.55010986328125, 0.621124267578125, 0.692138671875, 0.763153076171875, 0.83416748046875, 0.905181884765625, 0.9761962890625, 1.047210693359375, 1.11822509765625, 1.189239501953125, 1.26025390625, 1.331268310546875, 1.40228271484375, 1.473297119140625, 1.5443115234375, 1.615325927734375, 1.68634033203125, 1.757354736328125, 1.828369140625, 1.899383544921875, 1.97039794921875, 2.041412353515625, 2.1124267578125, 2.183441162109375, 2.25445556640625, 2.325469970703125, 2.396484375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 8.0, 6.0, 20.0, 24.0, 40.0, 72.0, 143.0, 279.0, 774.0, 3444.0, 51640.0, 4055821.0, 76364.0, 4340.0, 816.0, 259.0, 119.0, 44.0, 29.0, 8.0, 9.0, 6.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.1875, -19.7239990234375, -19.260498046875, -18.7969970703125, -18.33349609375, -17.8699951171875, -17.406494140625, -16.9429931640625, -16.4794921875, -16.0159912109375, -15.552490234375, -15.0889892578125, -14.62548828125, -14.1619873046875, -13.698486328125, -13.2349853515625, -12.771484375, -12.3079833984375, -11.844482421875, -11.3809814453125, -10.91748046875, -10.4539794921875, -9.990478515625, -9.5269775390625, -9.0634765625, -8.5999755859375, -8.136474609375, -7.6729736328125, -7.20947265625, -6.7459716796875, -6.282470703125, -5.8189697265625, -5.35546875, -4.8919677734375, -4.428466796875, -3.9649658203125, -3.50146484375, -3.0379638671875, -2.574462890625, -2.1109619140625, -1.6474609375, -1.1839599609375, -0.720458984375, -0.2569580078125, 0.20654296875, 0.6700439453125, 1.133544921875, 1.5970458984375, 2.060546875, 2.5240478515625, 2.987548828125, 3.4510498046875, 3.91455078125, 4.3780517578125, 4.841552734375, 5.3050537109375, 5.7685546875, 6.2320556640625, 6.695556640625, 7.1590576171875, 7.62255859375, 8.0860595703125, 8.549560546875, 9.0130615234375, 9.4765625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 9.0, 18.0, 31.0, 41.0, 57.0, 154.0, 501.0, 1374.0, 1207.0, 403.0, 136.0, 53.0, 38.0, 20.0, 6.0, 9.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.96875, -15.5877685546875, -15.206787109375, -14.8258056640625, -14.44482421875, -14.0638427734375, -13.682861328125, -13.3018798828125, -12.9208984375, -12.5399169921875, -12.158935546875, -11.7779541015625, -11.39697265625, -11.0159912109375, -10.635009765625, -10.2540283203125, -9.873046875, -9.4920654296875, -9.111083984375, -8.7301025390625, -8.34912109375, -7.9681396484375, -7.587158203125, -7.2061767578125, -6.8251953125, -6.4442138671875, -6.063232421875, -5.6822509765625, -5.30126953125, -4.9202880859375, -4.539306640625, -4.1583251953125, -3.77734375, -3.3963623046875, -3.015380859375, -2.6343994140625, -2.25341796875, -1.8724365234375, -1.491455078125, -1.1104736328125, -0.7294921875, -0.3485107421875, 0.032470703125, 0.4134521484375, 0.79443359375, 1.1754150390625, 1.556396484375, 1.9373779296875, 2.318359375, 2.6993408203125, 3.080322265625, 3.4613037109375, 3.84228515625, 4.2232666015625, 4.604248046875, 4.9852294921875, 5.3662109375, 5.7471923828125, 6.128173828125, 6.5091552734375, 6.89013671875, 7.2711181640625, 7.652099609375, 8.0330810546875, 8.4140625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 11.0, 28.0, 64.0, 140.0, 225.0, 243.0, 144.0, 66.0, 39.0, 15.0, 9.0, 9.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.453041076660156, -55.15670394897461, -52.8603630065918, -50.56402587890625, -48.26768493652344, -45.97134780883789, -43.675010681152344, -41.37866973876953, -39.082332611083984, -36.78599548339844, -34.489654541015625, -32.19331741333008, -29.8969783782959, -27.60063934326172, -25.304302215576172, -23.007963180541992, -20.711624145507812, -18.415285110473633, -16.118946075439453, -13.822608947753906, -11.526269912719727, -9.229930877685547, -6.933592796325684, -4.63725471496582, -2.3409156799316406, -0.04457712173461914, 2.2517614364624023, 4.548099994659424, 6.844438552856445, 9.140777587890625, 11.437115669250488, 13.733453750610352, 16.02978515625, 18.32612419128418, 20.62246322631836, 22.918800354003906, 25.215139389038086, 27.511478424072266, 29.807815551757812, 32.104156494140625, 34.40049362182617, 36.69683074951172, 38.99317169189453, 41.28950881958008, 43.585845947265625, 45.88218688964844, 48.178524017333984, 50.47486114501953, 52.771202087402344, 55.06753921508789, 57.3638801574707, 59.66021728515625, 61.95655822753906, 64.25289916992188, 66.54923248291016, 68.84557342529297, 71.14190673828125, 73.43824768066406, 75.73458099365234, 78.03092193603516, 80.32726287841797, 82.62359619140625, 84.91993713378906, 87.21627807617188, 89.51261901855469]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 7.0, 7.0, 5.0, 13.0, 16.0, 23.0, 27.0, 26.0, 27.0, 47.0, 23.0, 34.0, 51.0, 59.0, 59.0, 63.0, 64.0, 46.0, 43.0, 38.0, 37.0, 41.0, 34.0, 48.0, 26.0, 29.0, 20.0, 14.0, 23.0, 7.0, 7.0, 11.0, 6.0, 5.0, 0.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.568527221679688, -28.536561965942383, -27.504594802856445, -26.47262954711914, -25.440662384033203, -24.4086971282959, -23.376731872558594, -22.344764709472656, -21.31279945373535, -20.280834197998047, -19.24886703491211, -18.216901779174805, -17.1849365234375, -16.152969360351562, -15.121004104614258, -14.089037895202637, -13.057071685791016, -12.025105476379395, -10.993139266967773, -9.961174011230469, -8.929207801818848, -7.897241592407227, -6.865275859832764, -5.833310127258301, -4.80134391784668, -3.7693779468536377, -2.7374119758605957, -1.7054460048675537, -0.6734800338745117, 0.3584861755371094, 1.3904519081115723, 2.422417640686035, 3.4543800354003906, 4.486346244812012, 5.518311977386475, 6.5502777099609375, 7.582243919372559, 8.61421012878418, 9.646175384521484, 10.678141593933105, 11.710107803344727, 12.742074012756348, 13.774040222167969, 14.806005477905273, 15.837971687316895, 16.869937896728516, 17.90190315246582, 18.933868408203125, 19.965835571289062, 20.997800827026367, 22.029767990112305, 23.06173324584961, 24.093700408935547, 25.12566566467285, 26.157630920410156, 27.189598083496094, 28.2215633392334, 29.253528594970703, 30.28549575805664, 31.317461013793945, 32.34942626953125, 33.38139343261719, 34.413360595703125, 35.4453239440918, 36.477291107177734]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 8.0, 14.0, 14.0, 9.0, 33.0, 35.0, 33.0, 47.0, 84.0, 92.0, 104.0, 184.0, 226.0, 356.0, 564.0, 788.0, 1304.0, 2341.0, 3778.0, 6552.0, 12007.0, 22797.0, 45020.0, 93277.0, 186772.0, 275601.0, 195725.0, 98699.0, 47940.0, 24403.0, 12719.0, 6770.0, 3855.0, 2267.0, 1411.0, 910.0, 539.0, 394.0, 286.0, 158.0, 121.0, 87.0, 59.0, 41.0, 40.0, 31.0, 21.0, 8.0, 5.0, 12.0, 11.0, 1.0, 8.0, 0.0, 2.0, 0.0, 2.0], "bins": [-3.1796875, -3.08197021484375, -2.9842529296875, -2.88653564453125, -2.788818359375, -2.69110107421875, -2.5933837890625, -2.49566650390625, -2.39794921875, -2.30023193359375, -2.2025146484375, -2.10479736328125, -2.007080078125, -1.90936279296875, -1.8116455078125, -1.71392822265625, -1.6162109375, -1.51849365234375, -1.4207763671875, -1.32305908203125, -1.225341796875, -1.12762451171875, -1.0299072265625, -0.93218994140625, -0.83447265625, -0.73675537109375, -0.6390380859375, -0.54132080078125, -0.443603515625, -0.34588623046875, -0.2481689453125, -0.15045166015625, -0.052734375, 0.04498291015625, 0.1427001953125, 0.24041748046875, 0.338134765625, 0.43585205078125, 0.5335693359375, 0.63128662109375, 0.72900390625, 0.82672119140625, 0.9244384765625, 1.02215576171875, 1.119873046875, 1.21759033203125, 1.3153076171875, 1.41302490234375, 1.5107421875, 1.60845947265625, 1.7061767578125, 1.80389404296875, 1.901611328125, 1.99932861328125, 2.0970458984375, 2.19476318359375, 2.29248046875, 2.39019775390625, 2.4879150390625, 2.58563232421875, 2.683349609375, 2.78106689453125, 2.8787841796875, 2.97650146484375, 3.07421875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 4.0, 3.0, 7.0, 5.0, 11.0, 7.0, 6.0, 16.0, 11.0, 12.0, 15.0, 16.0, 21.0, 34.0, 22.0, 33.0, 31.0, 41.0, 52.0, 40.0, 38.0, 32.0, 41.0, 39.0, 37.0, 32.0, 31.0, 35.0, 35.0, 37.0, 31.0, 25.0, 23.0, 20.0, 20.0, 19.0, 21.0, 11.0, 13.0, 6.0, 12.0, 15.0, 7.0, 12.0, 6.0, 3.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0], "bins": [-2.380859375, -2.305206298828125, -2.22955322265625, -2.153900146484375, -2.0782470703125, -2.002593994140625, -1.92694091796875, -1.851287841796875, -1.775634765625, -1.699981689453125, -1.62432861328125, -1.548675537109375, -1.4730224609375, -1.397369384765625, -1.32171630859375, -1.246063232421875, -1.17041015625, -1.094757080078125, -1.01910400390625, -0.943450927734375, -0.8677978515625, -0.792144775390625, -0.71649169921875, -0.640838623046875, -0.565185546875, -0.489532470703125, -0.41387939453125, -0.338226318359375, -0.2625732421875, -0.186920166015625, -0.11126708984375, -0.035614013671875, 0.0400390625, 0.115692138671875, 0.19134521484375, 0.266998291015625, 0.3426513671875, 0.418304443359375, 0.49395751953125, 0.569610595703125, 0.645263671875, 0.720916748046875, 0.79656982421875, 0.872222900390625, 0.9478759765625, 1.023529052734375, 1.09918212890625, 1.174835205078125, 1.25048828125, 1.326141357421875, 1.40179443359375, 1.477447509765625, 1.5531005859375, 1.628753662109375, 1.70440673828125, 1.780059814453125, 1.855712890625, 1.931365966796875, 2.00701904296875, 2.082672119140625, 2.1583251953125, 2.233978271484375, 2.30963134765625, 2.385284423828125, 2.4609375]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 0.0, 3.0, 1.0, 5.0, 1.0, 11.0, 15.0, 11.0, 16.0, 24.0, 41.0, 60.0, 83.0, 148.0, 287.0, 617.0, 1692.0, 5919.0, 31087.0, 259843.0, 671358.0, 62814.0, 10215.0, 2578.0, 867.0, 349.0, 185.0, 128.0, 65.0, 37.0, 38.0, 13.0, 11.0, 10.0, 8.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.375, -10.080078125, -9.78515625, -9.490234375, -9.1953125, -8.900390625, -8.60546875, -8.310546875, -8.015625, -7.720703125, -7.42578125, -7.130859375, -6.8359375, -6.541015625, -6.24609375, -5.951171875, -5.65625, -5.361328125, -5.06640625, -4.771484375, -4.4765625, -4.181640625, -3.88671875, -3.591796875, -3.296875, -3.001953125, -2.70703125, -2.412109375, -2.1171875, -1.822265625, -1.52734375, -1.232421875, -0.9375, -0.642578125, -0.34765625, -0.052734375, 0.2421875, 0.537109375, 0.83203125, 1.126953125, 1.421875, 1.716796875, 2.01171875, 2.306640625, 2.6015625, 2.896484375, 3.19140625, 3.486328125, 3.78125, 4.076171875, 4.37109375, 4.666015625, 4.9609375, 5.255859375, 5.55078125, 5.845703125, 6.140625, 6.435546875, 6.73046875, 7.025390625, 7.3203125, 7.615234375, 7.91015625, 8.205078125, 8.5]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 5.0, 8.0, 16.0, 9.0, 10.0, 21.0, 11.0, 21.0, 27.0, 24.0, 31.0, 41.0, 35.0, 39.0, 47.0, 55.0, 63.0, 47.0, 49.0, 58.0, 67.0, 48.0, 32.0, 29.0, 31.0, 19.0, 27.0, 20.0, 17.0, 19.0, 7.0, 9.0, 16.0, 9.0, 10.0, 6.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.34375, -11.0234375, -10.703125, -10.3828125, -10.0625, -9.7421875, -9.421875, -9.1015625, -8.78125, -8.4609375, -8.140625, -7.8203125, -7.5, -7.1796875, -6.859375, -6.5390625, -6.21875, -5.8984375, -5.578125, -5.2578125, -4.9375, -4.6171875, -4.296875, -3.9765625, -3.65625, -3.3359375, -3.015625, -2.6953125, -2.375, -2.0546875, -1.734375, -1.4140625, -1.09375, -0.7734375, -0.453125, -0.1328125, 0.1875, 0.5078125, 0.828125, 1.1484375, 1.46875, 1.7890625, 2.109375, 2.4296875, 2.75, 3.0703125, 3.390625, 3.7109375, 4.03125, 4.3515625, 4.671875, 4.9921875, 5.3125, 5.6328125, 5.953125, 6.2734375, 6.59375, 6.9140625, 7.234375, 7.5546875, 7.875, 8.1953125, 8.515625, 8.8359375, 9.15625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 5.0, 5.0, 4.0, 8.0, 13.0, 20.0, 28.0, 37.0, 54.0, 73.0, 131.0, 262.0, 516.0, 1172.0, 3100.0, 9982.0, 38838.0, 188097.0, 628208.0, 136617.0, 28979.0, 7776.0, 2586.0, 1016.0, 420.0, 242.0, 119.0, 85.0, 38.0, 35.0, 24.0, 16.0, 15.0, 9.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8564453125, -1.7991485595703125, -1.741851806640625, -1.6845550537109375, -1.62725830078125, -1.5699615478515625, -1.512664794921875, -1.4553680419921875, -1.3980712890625, -1.3407745361328125, -1.283477783203125, -1.2261810302734375, -1.16888427734375, -1.1115875244140625, -1.054290771484375, -0.9969940185546875, -0.939697265625, -0.8824005126953125, -0.825103759765625, -0.7678070068359375, -0.71051025390625, -0.6532135009765625, -0.595916748046875, -0.5386199951171875, -0.4813232421875, -0.4240264892578125, -0.366729736328125, -0.3094329833984375, -0.25213623046875, -0.1948394775390625, -0.137542724609375, -0.0802459716796875, -0.02294921875, 0.0343475341796875, 0.091644287109375, 0.1489410400390625, 0.20623779296875, 0.2635345458984375, 0.320831298828125, 0.3781280517578125, 0.4354248046875, 0.4927215576171875, 0.550018310546875, 0.6073150634765625, 0.66461181640625, 0.7219085693359375, 0.779205322265625, 0.8365020751953125, 0.893798828125, 0.9510955810546875, 1.008392333984375, 1.0656890869140625, 1.12298583984375, 1.1802825927734375, 1.237579345703125, 1.2948760986328125, 1.3521728515625, 1.4094696044921875, 1.466766357421875, 1.5240631103515625, 1.58135986328125, 1.6386566162109375, 1.695953369140625, 1.7532501220703125, 1.810546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 4.0, 3.0, 9.0, 16.0, 6.0, 24.0, 19.0, 17.0, 20.0, 44.0, 45.0, 72.0, 62.0, 80.0, 75.0, 71.0, 61.0, 73.0, 59.0, 54.0, 27.0, 31.0, 37.0, 23.0, 17.0, 17.0, 9.0, 3.0, 7.0, 3.0, 7.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005083084106445312, -0.0004930309951305389, -0.00047775357961654663, -0.0004624761641025543, -0.000447198748588562, -0.0004319213330745697, -0.0004166439175605774, -0.0004013665020465851, -0.0003860890865325928, -0.00037081167101860046, -0.00035553425550460815, -0.00034025683999061584, -0.00032497942447662354, -0.0003097020089626312, -0.0002944245934486389, -0.0002791471779346466, -0.0002638697624206543, -0.000248592346906662, -0.00023331493139266968, -0.00021803751587867737, -0.00020276010036468506, -0.00018748268485069275, -0.00017220526933670044, -0.00015692785382270813, -0.00014165043830871582, -0.0001263730227947235, -0.0001110956072807312, -9.581819176673889e-05, -8.054077625274658e-05, -6.526336073875427e-05, -4.998594522476196e-05, -3.470852971076965e-05, -1.9431114196777344e-05, -4.153698682785034e-06, 1.1123716831207275e-05, 2.6401132345199585e-05, 4.1678547859191895e-05, 5.6955963373184204e-05, 7.223337888717651e-05, 8.751079440116882e-05, 0.00010278820991516113, 0.00011806562542915344, 0.00013334304094314575, 0.00014862045645713806, 0.00016389787197113037, 0.00017917528748512268, 0.000194452702999115, 0.0002097301185131073, 0.0002250075340270996, 0.00024028494954109192, 0.00025556236505508423, 0.00027083978056907654, 0.00028611719608306885, 0.00030139461159706116, 0.00031667202711105347, 0.0003319494426250458, 0.0003472268581390381, 0.0003625042736530304, 0.0003777816891670227, 0.000393059104681015, 0.0004083365201950073, 0.00042361393570899963, 0.00043889135122299194, 0.00045416876673698425, 0.00046944618225097656]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 17.0, 14.0, 32.0, 57.0, 70.0, 184.0, 479.0, 1411.0, 7481.0, 78217.0, 813842.0, 133206.0, 10650.0, 1854.0, 562.0, 223.0, 102.0, 59.0, 40.0, 19.0, 9.0, 10.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9033203125, -1.8009490966796875, -1.698577880859375, -1.5962066650390625, -1.49383544921875, -1.3914642333984375, -1.289093017578125, -1.1867218017578125, -1.0843505859375, -0.9819793701171875, -0.879608154296875, -0.7772369384765625, -0.67486572265625, -0.5724945068359375, -0.470123291015625, -0.3677520751953125, -0.265380859375, -0.1630096435546875, -0.060638427734375, 0.0417327880859375, 0.14410400390625, 0.2464752197265625, 0.348846435546875, 0.4512176513671875, 0.5535888671875, 0.6559600830078125, 0.758331298828125, 0.8607025146484375, 0.96307373046875, 1.0654449462890625, 1.167816162109375, 1.2701873779296875, 1.37255859375, 1.4749298095703125, 1.577301025390625, 1.6796722412109375, 1.78204345703125, 1.8844146728515625, 1.986785888671875, 2.0891571044921875, 2.1915283203125, 2.2938995361328125, 2.396270751953125, 2.4986419677734375, 2.60101318359375, 2.7033843994140625, 2.805755615234375, 2.9081268310546875, 3.010498046875, 3.1128692626953125, 3.215240478515625, 3.3176116943359375, 3.41998291015625, 3.5223541259765625, 3.624725341796875, 3.7270965576171875, 3.8294677734375, 3.9318389892578125, 4.034210205078125, 4.1365814208984375, 4.23895263671875, 4.3413238525390625, 4.443695068359375, 4.5460662841796875, 4.6484375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 7.0, 10.0, 15.0, 14.0, 36.0, 38.0, 44.0, 42.0, 65.0, 86.0, 94.0, 50.0, 83.0, 79.0, 68.0, 69.0, 55.0, 33.0, 27.0, 24.0, 16.0, 11.0, 11.0, 10.0, 1.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.013671875, -1.93927001953125, -1.8648681640625, -1.79046630859375, -1.716064453125, -1.64166259765625, -1.5672607421875, -1.49285888671875, -1.41845703125, -1.34405517578125, -1.2696533203125, -1.19525146484375, -1.120849609375, -1.04644775390625, -0.9720458984375, -0.89764404296875, -0.8232421875, -0.74884033203125, -0.6744384765625, -0.60003662109375, -0.525634765625, -0.45123291015625, -0.3768310546875, -0.30242919921875, -0.22802734375, -0.15362548828125, -0.0792236328125, -0.00482177734375, 0.069580078125, 0.14398193359375, 0.2183837890625, 0.29278564453125, 0.3671875, 0.44158935546875, 0.5159912109375, 0.59039306640625, 0.664794921875, 0.73919677734375, 0.8135986328125, 0.88800048828125, 0.96240234375, 1.03680419921875, 1.1112060546875, 1.18560791015625, 1.260009765625, 1.33441162109375, 1.4088134765625, 1.48321533203125, 1.5576171875, 1.63201904296875, 1.7064208984375, 1.78082275390625, 1.855224609375, 1.92962646484375, 2.0040283203125, 2.07843017578125, 2.15283203125, 2.22723388671875, 2.3016357421875, 2.37603759765625, 2.450439453125, 2.52484130859375, 2.5992431640625, 2.67364501953125, 2.748046875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 8.0, 3.0, 12.0, 10.0, 12.0, 20.0, 37.0, 84.0, 120.0, 219.0, 243.0, 104.0, 58.0, 29.0, 17.0, 11.0, 5.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.42758560180664, -53.9317741394043, -52.43595886230469, -50.940147399902344, -49.4443359375, -47.948524475097656, -46.45271301269531, -44.9568977355957, -43.46108627319336, -41.965274810791016, -40.469459533691406, -38.97364807128906, -37.47783660888672, -35.982025146484375, -34.48621368408203, -32.99039840698242, -31.494586944580078, -29.998775482177734, -28.502962112426758, -27.00714874267578, -25.511337280273438, -24.015525817871094, -22.519712448120117, -21.02389907836914, -19.528087615966797, -18.032276153564453, -16.536462783813477, -15.040650367736816, -13.544837951660156, -12.049025535583496, -10.553213119506836, -9.057400703430176, -7.561592102050781, -6.065779685974121, -4.569967269897461, -3.074154853820801, -1.5783424377441406, -0.08253002166748047, 1.4132823944091797, 2.90909481048584, 4.4049072265625, 5.90071964263916, 7.39653205871582, 8.89234447479248, 10.38815689086914, 11.8839693069458, 13.379781723022461, 14.875594139099121, 16.37140655517578, 17.867218017578125, 19.3630313873291, 20.858844757080078, 22.354656219482422, 23.850467681884766, 25.346281051635742, 26.84209442138672, 28.337905883789062, 29.833717346191406, 31.329530715942383, 32.82534408569336, 34.3211555480957, 35.81696701049805, 37.312782287597656, 38.80859375, 40.304405212402344]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 8.0, 7.0, 9.0, 9.0, 15.0, 9.0, 17.0, 9.0, 17.0, 17.0, 19.0, 18.0, 31.0, 20.0, 32.0, 28.0, 35.0, 59.0, 72.0, 78.0, 70.0, 56.0, 49.0, 45.0, 31.0, 26.0, 31.0, 26.0, 20.0, 23.0, 15.0, 12.0, 13.0, 8.0, 9.0, 7.0, 6.0, 7.0, 7.0, 5.0, 1.0, 1.0, 6.0, 3.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-34.654518127441406, -33.57296371459961, -32.49141311645508, -31.40985870361328, -30.328304290771484, -29.24675178527832, -28.165199279785156, -27.08364486694336, -26.002090454101562, -24.9205379486084, -23.8389835357666, -22.757431030273438, -21.67587661743164, -20.594324111938477, -19.512771606445312, -18.431217193603516, -17.34966468811035, -16.268112182617188, -15.18655776977539, -14.105005264282227, -13.02345085144043, -11.941898345947266, -10.860344886779785, -9.778791427612305, -8.697237968444824, -7.615684509277344, -6.534131050109863, -5.452578067779541, -4.3710246086120605, -3.28947114944458, -2.207918167114258, -1.1263647079467773, -0.044811248779296875, 1.036742091178894, 2.118295431137085, 3.1998486518859863, 4.281402111053467, 5.362955570220947, 6.4445085525512695, 7.52606201171875, 8.60761547088623, 9.689168930053711, 10.770722389221191, 11.852275848388672, 12.933828353881836, 14.015382766723633, 15.096935272216797, 16.178489685058594, 17.260042190551758, 18.341594696044922, 19.42314910888672, 20.504701614379883, 21.58625602722168, 22.667808532714844, 23.74936294555664, 24.830915451049805, 25.91246795654297, 26.994020462036133, 28.07557487487793, 29.157127380371094, 30.23868179321289, 31.320234298706055, 32.40178680419922, 33.483341217041016, 34.56489562988281]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 6.0, 6.0, 2.0, 13.0, 12.0, 18.0, 25.0, 37.0, 46.0, 61.0, 87.0, 114.0, 172.0, 251.0, 345.0, 537.0, 911.0, 1483.0, 2858.0, 6071.0, 15029.0, 40581.0, 118721.0, 369930.0, 1168885.0, 1616282.0, 576844.0, 180310.0, 58586.0, 20248.0, 7823.0, 3212.0, 1732.0, 941.0, 636.0, 450.0, 307.0, 187.0, 154.0, 103.0, 79.0, 49.0, 43.0, 34.0, 18.0, 12.0, 10.0, 9.0, 7.0, 7.0, 3.0, 5.0, 2.0, 3.0], "bins": [-2.22265625, -2.15948486328125, -2.0963134765625, -2.03314208984375, -1.969970703125, -1.90679931640625, -1.8436279296875, -1.78045654296875, -1.71728515625, -1.65411376953125, -1.5909423828125, -1.52777099609375, -1.464599609375, -1.40142822265625, -1.3382568359375, -1.27508544921875, -1.2119140625, -1.14874267578125, -1.0855712890625, -1.02239990234375, -0.959228515625, -0.89605712890625, -0.8328857421875, -0.76971435546875, -0.70654296875, -0.64337158203125, -0.5802001953125, -0.51702880859375, -0.453857421875, -0.39068603515625, -0.3275146484375, -0.26434326171875, -0.201171875, -0.13800048828125, -0.0748291015625, -0.01165771484375, 0.051513671875, 0.11468505859375, 0.1778564453125, 0.24102783203125, 0.30419921875, 0.36737060546875, 0.4305419921875, 0.49371337890625, 0.556884765625, 0.62005615234375, 0.6832275390625, 0.74639892578125, 0.8095703125, 0.87274169921875, 0.9359130859375, 0.99908447265625, 1.062255859375, 1.12542724609375, 1.1885986328125, 1.25177001953125, 1.31494140625, 1.37811279296875, 1.4412841796875, 1.50445556640625, 1.567626953125, 1.63079833984375, 1.6939697265625, 1.75714111328125, 1.8203125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 7.0, 11.0, 14.0, 16.0, 6.0, 12.0, 13.0, 21.0, 26.0, 30.0, 38.0, 39.0, 42.0, 58.0, 49.0, 27.0, 43.0, 39.0, 53.0, 49.0, 51.0, 43.0, 49.0, 35.0, 33.0, 26.0, 34.0, 30.0, 18.0, 18.0, 12.0, 7.0, 12.0, 12.0, 7.0, 4.0, 9.0, 3.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.453125, -2.362060546875, -2.27099609375, -2.179931640625, -2.0888671875, -1.997802734375, -1.90673828125, -1.815673828125, -1.724609375, -1.633544921875, -1.54248046875, -1.451416015625, -1.3603515625, -1.269287109375, -1.17822265625, -1.087158203125, -0.99609375, -0.905029296875, -0.81396484375, -0.722900390625, -0.6318359375, -0.540771484375, -0.44970703125, -0.358642578125, -0.267578125, -0.176513671875, -0.08544921875, 0.005615234375, 0.0966796875, 0.187744140625, 0.27880859375, 0.369873046875, 0.4609375, 0.552001953125, 0.64306640625, 0.734130859375, 0.8251953125, 0.916259765625, 1.00732421875, 1.098388671875, 1.189453125, 1.280517578125, 1.37158203125, 1.462646484375, 1.5537109375, 1.644775390625, 1.73583984375, 1.826904296875, 1.91796875, 2.009033203125, 2.10009765625, 2.191162109375, 2.2822265625, 2.373291015625, 2.46435546875, 2.555419921875, 2.646484375, 2.737548828125, 2.82861328125, 2.919677734375, 3.0107421875, 3.101806640625, 3.19287109375, 3.283935546875, 3.375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 8.0, 14.0, 14.0, 18.0, 48.0, 105.0, 201.0, 588.0, 2196.0, 25763.0, 3924820.0, 232612.0, 6037.0, 1115.0, 403.0, 157.0, 79.0, 49.0, 25.0, 9.0, 8.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5625, -8.168701171875, -7.77490234375, -7.381103515625, -6.9873046875, -6.593505859375, -6.19970703125, -5.805908203125, -5.412109375, -5.018310546875, -4.62451171875, -4.230712890625, -3.8369140625, -3.443115234375, -3.04931640625, -2.655517578125, -2.26171875, -1.867919921875, -1.47412109375, -1.080322265625, -0.6865234375, -0.292724609375, 0.10107421875, 0.494873046875, 0.888671875, 1.282470703125, 1.67626953125, 2.070068359375, 2.4638671875, 2.857666015625, 3.25146484375, 3.645263671875, 4.0390625, 4.432861328125, 4.82666015625, 5.220458984375, 5.6142578125, 6.008056640625, 6.40185546875, 6.795654296875, 7.189453125, 7.583251953125, 7.97705078125, 8.370849609375, 8.7646484375, 9.158447265625, 9.55224609375, 9.946044921875, 10.33984375, 10.733642578125, 11.12744140625, 11.521240234375, 11.9150390625, 12.308837890625, 12.70263671875, 13.096435546875, 13.490234375, 13.884033203125, 14.27783203125, 14.671630859375, 15.0654296875, 15.459228515625, 15.85302734375, 16.246826171875, 16.640625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 6.0, 12.0, 14.0, 20.0, 26.0, 63.0, 113.0, 227.0, 457.0, 895.0, 1100.0, 619.0, 242.0, 111.0, 65.0, 40.0, 23.0, 9.0, 9.0, 6.0, 4.0, 2.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.16015625, -4.90374755859375, -4.6473388671875, -4.39093017578125, -4.134521484375, -3.87811279296875, -3.6217041015625, -3.36529541015625, -3.10888671875, -2.85247802734375, -2.5960693359375, -2.33966064453125, -2.083251953125, -1.82684326171875, -1.5704345703125, -1.31402587890625, -1.0576171875, -0.80120849609375, -0.5447998046875, -0.28839111328125, -0.031982421875, 0.22442626953125, 0.4808349609375, 0.73724365234375, 0.99365234375, 1.25006103515625, 1.5064697265625, 1.76287841796875, 2.019287109375, 2.27569580078125, 2.5321044921875, 2.78851318359375, 3.044921875, 3.30133056640625, 3.5577392578125, 3.81414794921875, 4.070556640625, 4.32696533203125, 4.5833740234375, 4.83978271484375, 5.09619140625, 5.35260009765625, 5.6090087890625, 5.86541748046875, 6.121826171875, 6.37823486328125, 6.6346435546875, 6.89105224609375, 7.1474609375, 7.40386962890625, 7.6602783203125, 7.91668701171875, 8.173095703125, 8.42950439453125, 8.6859130859375, 8.94232177734375, 9.19873046875, 9.45513916015625, 9.7115478515625, 9.96795654296875, 10.224365234375, 10.48077392578125, 10.7371826171875, 10.99359130859375, 11.25]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 14.0, 23.0, 46.0, 68.0, 144.0, 176.0, 197.0, 137.0, 78.0, 36.0, 27.0, 15.0, 12.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-54.6044921875, -53.23634719848633, -51.868202209472656, -50.500057220458984, -49.13191223144531, -47.76376724243164, -46.39562225341797, -45.02747344970703, -43.659332275390625, -42.29118728637695, -40.92304229736328, -39.55489730834961, -38.18675231933594, -36.818607330322266, -35.450462341308594, -34.082313537597656, -32.714168548583984, -31.346023559570312, -29.97787857055664, -28.60973358154297, -27.241588592529297, -25.873443603515625, -24.50529670715332, -23.13715171813965, -21.769006729125977, -20.400861740112305, -19.032716751098633, -17.664569854736328, -16.296424865722656, -14.9282808303833, -13.560134887695312, -12.19198989868164, -10.823841094970703, -9.455696105957031, -8.08755111694336, -6.719405174255371, -5.351260185241699, -3.9831151962280273, -2.614969253540039, -1.2468242645263672, 0.12132072448730469, 1.4894659519195557, 2.8576111793518066, 4.225756645202637, 5.593901634216309, 6.9620466232299805, 8.330192565917969, 9.69833755493164, 11.066482543945312, 12.434627532958984, 13.802772521972656, 15.170918464660645, 16.5390625, 17.907207489013672, 19.275354385375977, 20.64349937438965, 22.01164436340332, 23.379789352416992, 24.747934341430664, 26.11608123779297, 27.48422622680664, 28.852371215820312, 30.220516204833984, 31.588661193847656, 32.95680618286133]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 5.0, 6.0, 10.0, 14.0, 12.0, 11.0, 12.0, 14.0, 26.0, 25.0, 25.0, 15.0, 41.0, 33.0, 43.0, 50.0, 46.0, 49.0, 51.0, 44.0, 44.0, 48.0, 62.0, 43.0, 34.0, 36.0, 27.0, 32.0, 21.0, 20.0, 17.0, 7.0, 22.0, 10.0, 11.0, 13.0, 6.0, 5.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-22.924091339111328, -22.178064346313477, -21.432037353515625, -20.686010360717773, -19.939983367919922, -19.19395637512207, -18.44792938232422, -17.701900482177734, -16.955875396728516, -16.209848403930664, -15.463821411132812, -14.717794418334961, -13.97176742553711, -13.225740432739258, -12.47971248626709, -11.733685493469238, -10.98765754699707, -10.241630554199219, -9.495603561401367, -8.749576568603516, -8.003549575805664, -7.257522106170654, -6.5114946365356445, -5.765467643737793, -5.019440650939941, -4.27341365814209, -3.527386426925659, -2.7813591957092285, -2.035332202911377, -1.2893052101135254, -0.5432777404785156, 0.20274925231933594, 0.9487762451171875, 1.6948033571243286, 2.4408304691314697, 3.1868577003479004, 3.932884693145752, 4.6789116859436035, 5.424939155578613, 6.170966148376465, 6.916993141174316, 7.663020133972168, 8.40904712677002, 9.155075073242188, 9.901102066040039, 10.64712905883789, 11.393156051635742, 12.139183044433594, 12.885210037231445, 13.631237030029297, 14.377264022827148, 15.123291015625, 15.869318008422852, 16.615345001220703, 17.361373901367188, 18.107398986816406, 18.85342788696289, 19.599454879760742, 20.345481872558594, 21.091508865356445, 21.837535858154297, 22.58356285095215, 23.32958984375, 24.075618743896484, 24.821643829345703]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 6.0, 12.0, 16.0, 23.0, 29.0, 47.0, 80.0, 88.0, 131.0, 202.0, 311.0, 485.0, 796.0, 1466.0, 2581.0, 4924.0, 10148.0, 22268.0, 51206.0, 127584.0, 311247.0, 302263.0, 121577.0, 49053.0, 21405.0, 9727.0, 4709.0, 2442.0, 1434.0, 854.0, 511.0, 303.0, 202.0, 138.0, 79.0, 62.0, 33.0, 28.0, 29.0, 19.0, 12.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.900390625, -3.778411865234375, -3.65643310546875, -3.534454345703125, -3.4124755859375, -3.290496826171875, -3.16851806640625, -3.046539306640625, -2.924560546875, -2.802581787109375, -2.68060302734375, -2.558624267578125, -2.4366455078125, -2.314666748046875, -2.19268798828125, -2.070709228515625, -1.94873046875, -1.826751708984375, -1.70477294921875, -1.582794189453125, -1.4608154296875, -1.338836669921875, -1.21685791015625, -1.094879150390625, -0.972900390625, -0.850921630859375, -0.72894287109375, -0.606964111328125, -0.4849853515625, -0.363006591796875, -0.24102783203125, -0.119049072265625, 0.0029296875, 0.124908447265625, 0.24688720703125, 0.368865966796875, 0.4908447265625, 0.612823486328125, 0.73480224609375, 0.856781005859375, 0.978759765625, 1.100738525390625, 1.22271728515625, 1.344696044921875, 1.4666748046875, 1.588653564453125, 1.71063232421875, 1.832611083984375, 1.95458984375, 2.076568603515625, 2.19854736328125, 2.320526123046875, 2.4425048828125, 2.564483642578125, 2.68646240234375, 2.808441162109375, 2.930419921875, 3.052398681640625, 3.17437744140625, 3.296356201171875, 3.4183349609375, 3.540313720703125, 3.66229248046875, 3.784271240234375, 3.90625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 5.0, 5.0, 7.0, 8.0, 16.0, 19.0, 14.0, 22.0, 30.0, 26.0, 36.0, 37.0, 42.0, 43.0, 46.0, 62.0, 52.0, 65.0, 46.0, 47.0, 37.0, 37.0, 35.0, 45.0, 31.0, 32.0, 26.0, 30.0, 24.0, 15.0, 13.0, 12.0, 12.0, 8.0, 1.0, 5.0, 2.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.734375, -2.636199951171875, -2.53802490234375, -2.439849853515625, -2.3416748046875, -2.243499755859375, -2.14532470703125, -2.047149658203125, -1.948974609375, -1.850799560546875, -1.75262451171875, -1.654449462890625, -1.5562744140625, -1.458099365234375, -1.35992431640625, -1.261749267578125, -1.16357421875, -1.065399169921875, -0.96722412109375, -0.869049072265625, -0.7708740234375, -0.672698974609375, -0.57452392578125, -0.476348876953125, -0.378173828125, -0.279998779296875, -0.18182373046875, -0.083648681640625, 0.0145263671875, 0.112701416015625, 0.21087646484375, 0.309051513671875, 0.4072265625, 0.505401611328125, 0.60357666015625, 0.701751708984375, 0.7999267578125, 0.898101806640625, 0.99627685546875, 1.094451904296875, 1.192626953125, 1.290802001953125, 1.38897705078125, 1.487152099609375, 1.5853271484375, 1.683502197265625, 1.78167724609375, 1.879852294921875, 1.97802734375, 2.076202392578125, 2.17437744140625, 2.272552490234375, 2.3707275390625, 2.468902587890625, 2.56707763671875, 2.665252685546875, 2.763427734375, 2.861602783203125, 2.95977783203125, 3.057952880859375, 3.1561279296875, 3.254302978515625, 3.35247802734375, 3.450653076171875, 3.548828125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 8.0, 12.0, 6.0, 22.0, 18.0, 26.0, 51.0, 82.0, 100.0, 204.0, 365.0, 684.0, 1265.0, 3342.0, 12680.0, 104087.0, 827427.0, 81475.0, 10748.0, 3145.0, 1219.0, 637.0, 345.0, 204.0, 118.0, 80.0, 53.0, 38.0, 26.0, 24.0, 11.0, 12.0, 8.0, 6.0, 3.0, 3.0, 1.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.0078125, -11.6593017578125, -11.310791015625, -10.9622802734375, -10.61376953125, -10.2652587890625, -9.916748046875, -9.5682373046875, -9.2197265625, -8.8712158203125, -8.522705078125, -8.1741943359375, -7.82568359375, -7.4771728515625, -7.128662109375, -6.7801513671875, -6.431640625, -6.0831298828125, -5.734619140625, -5.3861083984375, -5.03759765625, -4.6890869140625, -4.340576171875, -3.9920654296875, -3.6435546875, -3.2950439453125, -2.946533203125, -2.5980224609375, -2.24951171875, -1.9010009765625, -1.552490234375, -1.2039794921875, -0.85546875, -0.5069580078125, -0.158447265625, 0.1900634765625, 0.53857421875, 0.8870849609375, 1.235595703125, 1.5841064453125, 1.9326171875, 2.2811279296875, 2.629638671875, 2.9781494140625, 3.32666015625, 3.6751708984375, 4.023681640625, 4.3721923828125, 4.720703125, 5.0692138671875, 5.417724609375, 5.7662353515625, 6.11474609375, 6.4632568359375, 6.811767578125, 7.1602783203125, 7.5087890625, 7.8572998046875, 8.205810546875, 8.5543212890625, 8.90283203125, 9.2513427734375, 9.599853515625, 9.9483642578125, 10.296875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 5.0, 6.0, 18.0, 22.0, 23.0, 25.0, 39.0, 50.0, 49.0, 71.0, 73.0, 67.0, 82.0, 65.0, 73.0, 57.0, 48.0, 41.0, 41.0, 27.0, 25.0, 20.0, 12.0, 13.0, 9.0, 10.0, 4.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.4453125, -14.984375, -14.5234375, -14.0625, -13.6015625, -13.140625, -12.6796875, -12.21875, -11.7578125, -11.296875, -10.8359375, -10.375, -9.9140625, -9.453125, -8.9921875, -8.53125, -8.0703125, -7.609375, -7.1484375, -6.6875, -6.2265625, -5.765625, -5.3046875, -4.84375, -4.3828125, -3.921875, -3.4609375, -3.0, -2.5390625, -2.078125, -1.6171875, -1.15625, -0.6953125, -0.234375, 0.2265625, 0.6875, 1.1484375, 1.609375, 2.0703125, 2.53125, 2.9921875, 3.453125, 3.9140625, 4.375, 4.8359375, 5.296875, 5.7578125, 6.21875, 6.6796875, 7.140625, 7.6015625, 8.0625, 8.5234375, 8.984375, 9.4453125, 9.90625, 10.3671875, 10.828125, 11.2890625, 11.75, 12.2109375, 12.671875, 13.1328125, 13.59375, 14.0546875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 4.0, 9.0, 12.0, 12.0, 18.0, 39.0, 40.0, 77.0, 99.0, 172.0, 353.0, 630.0, 1575.0, 4370.0, 15819.0, 81555.0, 699354.0, 200837.0, 31406.0, 7720.0, 2381.0, 1001.0, 447.0, 232.0, 125.0, 86.0, 41.0, 48.0, 37.0, 18.0, 10.0, 7.0, 6.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-2.203125, -2.13580322265625, -2.0684814453125, -2.00115966796875, -1.933837890625, -1.86651611328125, -1.7991943359375, -1.73187255859375, -1.66455078125, -1.59722900390625, -1.5299072265625, -1.46258544921875, -1.395263671875, -1.32794189453125, -1.2606201171875, -1.19329833984375, -1.1259765625, -1.05865478515625, -0.9913330078125, -0.92401123046875, -0.856689453125, -0.78936767578125, -0.7220458984375, -0.65472412109375, -0.58740234375, -0.52008056640625, -0.4527587890625, -0.38543701171875, -0.318115234375, -0.25079345703125, -0.1834716796875, -0.11614990234375, -0.048828125, 0.01849365234375, 0.0858154296875, 0.15313720703125, 0.220458984375, 0.28778076171875, 0.3551025390625, 0.42242431640625, 0.48974609375, 0.55706787109375, 0.6243896484375, 0.69171142578125, 0.759033203125, 0.82635498046875, 0.8936767578125, 0.96099853515625, 1.0283203125, 1.09564208984375, 1.1629638671875, 1.23028564453125, 1.297607421875, 1.36492919921875, 1.4322509765625, 1.49957275390625, 1.56689453125, 1.63421630859375, 1.7015380859375, 1.76885986328125, 1.836181640625, 1.90350341796875, 1.9708251953125, 2.03814697265625, 2.10546875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 3.0, 11.0, 7.0, 16.0, 19.0, 18.0, 32.0, 37.0, 35.0, 67.0, 69.0, 98.0, 101.0, 103.0, 101.0, 71.0, 55.0, 47.0, 27.0, 30.0, 10.0, 12.0, 11.0, 7.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.000774383544921875, -0.000754963606595993, -0.0007355436682701111, -0.0007161237299442291, -0.0006967037916183472, -0.0006772838532924652, -0.0006578639149665833, -0.0006384439766407013, -0.0006190240383148193, -0.0005996040999889374, -0.0005801841616630554, -0.0005607642233371735, -0.0005413442850112915, -0.0005219243466854095, -0.0005025044083595276, -0.00048308447003364563, -0.00046366453170776367, -0.0004442445933818817, -0.00042482465505599976, -0.0004054047167301178, -0.00038598477840423584, -0.0003665648400783539, -0.0003471449017524719, -0.00032772496342658997, -0.000308305025100708, -0.00028888508677482605, -0.0002694651484489441, -0.00025004521012306213, -0.00023062527179718018, -0.00021120533347129822, -0.00019178539514541626, -0.0001723654568195343, -0.00015294551849365234, -0.00013352558016777039, -0.00011410564184188843, -9.468570351600647e-05, -7.526576519012451e-05, -5.5845826864242554e-05, -3.6425888538360596e-05, -1.7005950212478638e-05, 2.4139881134033203e-06, 2.183392643928528e-05, 4.1253864765167236e-05, 6.0673803091049194e-05, 8.009374141693115e-05, 9.951367974281311e-05, 0.00011893361806869507, 0.00013835355639457703, 0.00015777349472045898, 0.00017719343304634094, 0.0001966133713722229, 0.00021603330969810486, 0.00023545324802398682, 0.0002548731863498688, 0.00027429312467575073, 0.0002937130630016327, 0.00031313300132751465, 0.0003325529396533966, 0.00035197287797927856, 0.0003713928163051605, 0.0003908127546310425, 0.00041023269295692444, 0.0004296526312828064, 0.00044907256960868835, 0.0004684925079345703]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 0.0, 2.0, 4.0, 5.0, 6.0, 8.0, 13.0, 19.0, 26.0, 19.0, 43.0, 58.0, 105.0, 164.0, 322.0, 669.0, 1500.0, 4660.0, 22649.0, 221553.0, 729513.0, 54168.0, 8592.0, 2422.0, 931.0, 471.0, 222.0, 142.0, 84.0, 54.0, 33.0, 30.0, 13.0, 15.0, 16.0, 6.0, 5.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.146484375, -2.070404052734375, -1.99432373046875, -1.918243408203125, -1.8421630859375, -1.766082763671875, -1.69000244140625, -1.613922119140625, -1.537841796875, -1.461761474609375, -1.38568115234375, -1.309600830078125, -1.2335205078125, -1.157440185546875, -1.08135986328125, -1.005279541015625, -0.92919921875, -0.853118896484375, -0.77703857421875, -0.700958251953125, -0.6248779296875, -0.548797607421875, -0.47271728515625, -0.396636962890625, -0.320556640625, -0.244476318359375, -0.16839599609375, -0.092315673828125, -0.0162353515625, 0.059844970703125, 0.13592529296875, 0.212005615234375, 0.2880859375, 0.364166259765625, 0.44024658203125, 0.516326904296875, 0.5924072265625, 0.668487548828125, 0.74456787109375, 0.820648193359375, 0.896728515625, 0.972808837890625, 1.04888916015625, 1.124969482421875, 1.2010498046875, 1.277130126953125, 1.35321044921875, 1.429290771484375, 1.50537109375, 1.581451416015625, 1.65753173828125, 1.733612060546875, 1.8096923828125, 1.885772705078125, 1.96185302734375, 2.037933349609375, 2.114013671875, 2.190093994140625, 2.26617431640625, 2.342254638671875, 2.4183349609375, 2.494415283203125, 2.57049560546875, 2.646575927734375, 2.72265625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 8.0, 4.0, 9.0, 16.0, 13.0, 25.0, 43.0, 46.0, 75.0, 70.0, 115.0, 100.0, 98.0, 71.0, 75.0, 59.0, 39.0, 38.0, 22.0, 23.0, 9.0, 8.0, 7.0, 7.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.431640625, -2.36187744140625, -2.2921142578125, -2.22235107421875, -2.152587890625, -2.08282470703125, -2.0130615234375, -1.94329833984375, -1.87353515625, -1.80377197265625, -1.7340087890625, -1.66424560546875, -1.594482421875, -1.52471923828125, -1.4549560546875, -1.38519287109375, -1.3154296875, -1.24566650390625, -1.1759033203125, -1.10614013671875, -1.036376953125, -0.96661376953125, -0.8968505859375, -0.82708740234375, -0.75732421875, -0.68756103515625, -0.6177978515625, -0.54803466796875, -0.478271484375, -0.40850830078125, -0.3387451171875, -0.26898193359375, -0.19921875, -0.12945556640625, -0.0596923828125, 0.01007080078125, 0.079833984375, 0.14959716796875, 0.2193603515625, 0.28912353515625, 0.35888671875, 0.42864990234375, 0.4984130859375, 0.56817626953125, 0.637939453125, 0.70770263671875, 0.7774658203125, 0.84722900390625, 0.9169921875, 0.98675537109375, 1.0565185546875, 1.12628173828125, 1.196044921875, 1.26580810546875, 1.3355712890625, 1.40533447265625, 1.47509765625, 1.54486083984375, 1.6146240234375, 1.68438720703125, 1.754150390625, 1.82391357421875, 1.8936767578125, 1.96343994140625, 2.033203125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 3.0, 14.0, 14.0, 28.0, 57.0, 95.0, 181.0, 332.0, 139.0, 72.0, 29.0, 17.0, 15.0, 6.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-83.92735290527344, -81.94813537597656, -79.96892547607422, -77.98970794677734, -76.01049041748047, -74.03128051757812, -72.05206298828125, -70.07284545898438, -68.0936279296875, -66.11441040039062, -64.13520050048828, -62.155982971191406, -60.17676544189453, -58.19755172729492, -56.21833801269531, -54.23912048339844, -52.259910583496094, -50.280696868896484, -48.30147933959961, -46.322265625, -44.343048095703125, -42.363834381103516, -40.384620666503906, -38.40540313720703, -36.42618942260742, -34.44697570800781, -32.46775817871094, -30.488544464111328, -28.509328842163086, -26.530113220214844, -24.550899505615234, -22.571683883666992, -20.59246826171875, -18.613252639770508, -16.634037017822266, -14.654823303222656, -12.675607681274414, -10.696392059326172, -8.717177391052246, -6.73796272277832, -4.758747100830078, -2.779531955718994, -0.8003168106079102, 1.1788983345031738, 3.158113479614258, 5.1373291015625, 7.116543769836426, 9.095758438110352, 11.074974060058594, 13.054189682006836, 15.033404350280762, 17.012619018554688, 18.99183464050293, 20.971050262451172, 22.95026397705078, 24.929479598999023, 26.908695220947266, 28.887910842895508, 30.86712646484375, 32.84634017944336, 34.82555389404297, 36.804771423339844, 38.78398513793945, 40.76319885253906, 42.74241638183594]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 8.0, 7.0, 10.0, 13.0, 14.0, 21.0, 18.0, 27.0, 20.0, 27.0, 28.0, 38.0, 41.0, 49.0, 74.0, 113.0, 121.0, 59.0, 38.0, 39.0, 41.0, 32.0, 16.0, 15.0, 19.0, 17.0, 23.0, 13.0, 14.0, 12.0, 6.0, 3.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-49.653133392333984, -48.226802825927734, -46.800472259521484, -45.3741455078125, -43.94781494140625, -42.521484375, -41.09515380859375, -39.6688232421875, -38.24249267578125, -36.816162109375, -35.38983154296875, -33.9635009765625, -32.537174224853516, -31.110843658447266, -29.684513092041016, -28.258182525634766, -26.83185386657715, -25.4055233001709, -23.97919464111328, -22.55286407470703, -21.12653350830078, -19.70020294189453, -18.273874282836914, -16.847543716430664, -15.42121410369873, -13.994884490966797, -12.568553924560547, -11.142224311828613, -9.71589469909668, -8.28956413269043, -6.863234519958496, -5.436903953552246, -4.0105743408203125, -2.5842442512512207, -1.157914400100708, 0.2684154510498047, 1.6947455406188965, 3.1210756301879883, 4.547405242919922, 5.973735809326172, 7.4000654220581055, 8.826395034790039, 10.252725601196289, 11.679055213928223, 13.105384826660156, 14.531715393066406, 15.95804500579834, 17.384376525878906, 18.810705184936523, 20.237035751342773, 21.66336441040039, 23.08969497680664, 24.51602554321289, 25.94235610961914, 27.368684768676758, 28.795015335083008, 30.221343994140625, 31.647674560546875, 33.074005126953125, 34.500335693359375, 35.92666244506836, 37.35299301147461, 38.77932357788086, 40.20565414428711, 41.63198471069336]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 8.0, 3.0, 9.0, 13.0, 14.0, 22.0, 38.0, 42.0, 66.0, 65.0, 105.0, 152.0, 229.0, 337.0, 485.0, 752.0, 1263.0, 2284.0, 4880.0, 11763.0, 36024.0, 119608.0, 436927.0, 1543647.0, 1488896.0, 401318.0, 99984.0, 26858.0, 9242.0, 3751.0, 1950.0, 1168.0, 741.0, 471.0, 316.0, 231.0, 163.0, 132.0, 88.0, 69.0, 50.0, 33.0, 26.0, 22.0, 10.0, 9.0, 7.0, 6.0, 4.0, 4.0, 1.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.494140625, -2.41357421875, -2.3330078125, -2.25244140625, -2.171875, -2.09130859375, -2.0107421875, -1.93017578125, -1.849609375, -1.76904296875, -1.6884765625, -1.60791015625, -1.52734375, -1.44677734375, -1.3662109375, -1.28564453125, -1.205078125, -1.12451171875, -1.0439453125, -0.96337890625, -0.8828125, -0.80224609375, -0.7216796875, -0.64111328125, -0.560546875, -0.47998046875, -0.3994140625, -0.31884765625, -0.23828125, -0.15771484375, -0.0771484375, 0.00341796875, 0.083984375, 0.16455078125, 0.2451171875, 0.32568359375, 0.40625, 0.48681640625, 0.5673828125, 0.64794921875, 0.728515625, 0.80908203125, 0.8896484375, 0.97021484375, 1.05078125, 1.13134765625, 1.2119140625, 1.29248046875, 1.373046875, 1.45361328125, 1.5341796875, 1.61474609375, 1.6953125, 1.77587890625, 1.8564453125, 1.93701171875, 2.017578125, 2.09814453125, 2.1787109375, 2.25927734375, 2.33984375, 2.42041015625, 2.5009765625, 2.58154296875, 2.662109375]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 8.0, 6.0, 9.0, 13.0, 20.0, 17.0, 30.0, 29.0, 25.0, 32.0, 38.0, 32.0, 47.0, 58.0, 56.0, 49.0, 44.0, 45.0, 61.0, 59.0, 41.0, 31.0, 35.0, 34.0, 31.0, 24.0, 20.0, 18.0, 14.0, 13.0, 16.0, 7.0, 8.0, 3.0, 7.0, 11.0, 0.0, 5.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.724609375, -2.619354248046875, -2.51409912109375, -2.408843994140625, -2.3035888671875, -2.198333740234375, -2.09307861328125, -1.987823486328125, -1.882568359375, -1.777313232421875, -1.67205810546875, -1.566802978515625, -1.4615478515625, -1.356292724609375, -1.25103759765625, -1.145782470703125, -1.04052734375, -0.935272216796875, -0.83001708984375, -0.724761962890625, -0.6195068359375, -0.514251708984375, -0.40899658203125, -0.303741455078125, -0.198486328125, -0.093231201171875, 0.01202392578125, 0.117279052734375, 0.2225341796875, 0.327789306640625, 0.43304443359375, 0.538299560546875, 0.6435546875, 0.748809814453125, 0.85406494140625, 0.959320068359375, 1.0645751953125, 1.169830322265625, 1.27508544921875, 1.380340576171875, 1.485595703125, 1.590850830078125, 1.69610595703125, 1.801361083984375, 1.9066162109375, 2.011871337890625, 2.11712646484375, 2.222381591796875, 2.32763671875, 2.432891845703125, 2.53814697265625, 2.643402099609375, 2.7486572265625, 2.853912353515625, 2.95916748046875, 3.064422607421875, 3.169677734375, 3.274932861328125, 3.38018798828125, 3.485443115234375, 3.5906982421875, 3.695953369140625, 3.80120849609375, 3.906463623046875, 4.01171875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 7.0, 11.0, 9.0, 10.0, 30.0, 75.0, 167.0, 378.0, 1210.0, 11254.0, 3974040.0, 202630.0, 3473.0, 627.0, 201.0, 90.0, 37.0, 13.0, 12.0, 7.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.78125, -25.21826171875, -24.6552734375, -24.09228515625, -23.529296875, -22.96630859375, -22.4033203125, -21.84033203125, -21.27734375, -20.71435546875, -20.1513671875, -19.58837890625, -19.025390625, -18.46240234375, -17.8994140625, -17.33642578125, -16.7734375, -16.21044921875, -15.6474609375, -15.08447265625, -14.521484375, -13.95849609375, -13.3955078125, -12.83251953125, -12.26953125, -11.70654296875, -11.1435546875, -10.58056640625, -10.017578125, -9.45458984375, -8.8916015625, -8.32861328125, -7.765625, -7.20263671875, -6.6396484375, -6.07666015625, -5.513671875, -4.95068359375, -4.3876953125, -3.82470703125, -3.26171875, -2.69873046875, -2.1357421875, -1.57275390625, -1.009765625, -0.44677734375, 0.1162109375, 0.67919921875, 1.2421875, 1.80517578125, 2.3681640625, 2.93115234375, 3.494140625, 4.05712890625, 4.6201171875, 5.18310546875, 5.74609375, 6.30908203125, 6.8720703125, 7.43505859375, 7.998046875, 8.56103515625, 9.1240234375, 9.68701171875, 10.25]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 11.0, 18.0, 36.0, 63.0, 107.0, 221.0, 511.0, 1062.0, 1098.0, 539.0, 203.0, 85.0, 36.0, 30.0, 13.0, 13.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0], "bins": [-15.59375, -15.27520751953125, -14.9566650390625, -14.63812255859375, -14.319580078125, -14.00103759765625, -13.6824951171875, -13.36395263671875, -13.04541015625, -12.72686767578125, -12.4083251953125, -12.08978271484375, -11.771240234375, -11.45269775390625, -11.1341552734375, -10.81561279296875, -10.4970703125, -10.17852783203125, -9.8599853515625, -9.54144287109375, -9.222900390625, -8.90435791015625, -8.5858154296875, -8.26727294921875, -7.94873046875, -7.63018798828125, -7.3116455078125, -6.99310302734375, -6.674560546875, -6.35601806640625, -6.0374755859375, -5.71893310546875, -5.400390625, -5.08184814453125, -4.7633056640625, -4.44476318359375, -4.126220703125, -3.80767822265625, -3.4891357421875, -3.17059326171875, -2.85205078125, -2.53350830078125, -2.2149658203125, -1.89642333984375, -1.577880859375, -1.25933837890625, -0.9407958984375, -0.62225341796875, -0.3037109375, 0.01483154296875, 0.3333740234375, 0.65191650390625, 0.970458984375, 1.28900146484375, 1.6075439453125, 1.92608642578125, 2.24462890625, 2.56317138671875, 2.8817138671875, 3.20025634765625, 3.518798828125, 3.83734130859375, 4.1558837890625, 4.47442626953125, 4.79296875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 10.0, 10.0, 17.0, 41.0, 82.0, 151.0, 236.0, 215.0, 108.0, 60.0, 34.0, 15.0, 7.0, 3.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-92.2088623046875, -90.16050720214844, -88.11214447021484, -86.06378936767578, -84.01542663574219, -81.96707153320312, -79.91870880126953, -77.87035369873047, -75.82199096679688, -73.77363586425781, -71.72527313232422, -69.67691802978516, -67.62855529785156, -65.5802001953125, -63.531837463378906, -61.483482360839844, -59.435123443603516, -57.38676452636719, -55.33840560913086, -53.29004669189453, -51.2416877746582, -49.193328857421875, -47.14497375488281, -45.09661102294922, -43.048255920410156, -40.99989700317383, -38.9515380859375, -36.90317916870117, -34.854820251464844, -32.806461334228516, -30.75810432434082, -28.709745407104492, -26.661380767822266, -24.613021850585938, -22.56466293334961, -20.51630401611328, -18.467945098876953, -16.419586181640625, -14.37122917175293, -12.322870254516602, -10.274511337280273, -8.226152420043945, -6.177793979644775, -4.1294355392456055, -2.0810766220092773, -0.03271770477294922, 2.0156402587890625, 4.063999176025391, 6.112358093261719, 8.160717010498047, 10.209075927734375, 12.257433891296387, 14.305792808532715, 16.35415267944336, 18.402509689331055, 20.450868606567383, 22.49922752380371, 24.54758644104004, 26.595945358276367, 28.644302368164062, 30.69266128540039, 32.74102020263672, 34.78937911987305, 36.837738037109375, 38.8860969543457]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 3.0, 2.0, 1.0, 5.0, 4.0, 6.0, 7.0, 14.0, 7.0, 11.0, 11.0, 17.0, 23.0, 31.0, 34.0, 34.0, 46.0, 53.0, 50.0, 47.0, 46.0, 62.0, 40.0, 53.0, 41.0, 42.0, 36.0, 33.0, 37.0, 34.0, 25.0, 29.0, 27.0, 13.0, 16.0, 16.0, 10.0, 10.0, 2.0, 5.0, 6.0, 12.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.014888763427734, -31.00702476501465, -29.99915885925293, -28.991294860839844, -27.983428955078125, -26.97556495666504, -25.967700958251953, -24.959835052490234, -23.95197105407715, -22.944107055664062, -21.936241149902344, -20.928377151489258, -19.920513153076172, -18.912647247314453, -17.904783248901367, -16.89691925048828, -15.889053344726562, -14.88118839263916, -13.873323440551758, -12.865459442138672, -11.85759449005127, -10.849729537963867, -9.841865539550781, -8.834000587463379, -7.826135635375977, -6.818270683288574, -5.81040620803833, -4.802541732788086, -3.7946767807006836, -2.7868118286132812, -1.778947353363037, -0.771082878112793, 0.23677825927734375, 1.244642972946167, 2.2525076866149902, 3.2603724002838135, 4.268237113952637, 5.276102066040039, 6.283966541290283, 7.291831016540527, 8.29969596862793, 9.307560920715332, 10.315425872802734, 11.32328987121582, 12.331154823303223, 13.339019775390625, 14.346883773803711, 15.354748725891113, 16.362613677978516, 17.3704776763916, 18.37834358215332, 19.386207580566406, 20.394073486328125, 21.40193748474121, 22.409801483154297, 23.417667388916016, 24.4255313873291, 25.433395385742188, 26.441261291503906, 27.449125289916992, 28.456989288330078, 29.464855194091797, 30.472719192504883, 31.48058319091797, 32.48844909667969]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 8.0, 4.0, 11.0, 17.0, 23.0, 22.0, 30.0, 53.0, 79.0, 105.0, 167.0, 239.0, 338.0, 605.0, 969.0, 1519.0, 2844.0, 5332.0, 10154.0, 21382.0, 49098.0, 130493.0, 385983.0, 275719.0, 92142.0, 36779.0, 16245.0, 7949.0, 4201.0, 2321.0, 1364.0, 831.0, 520.0, 305.0, 221.0, 167.0, 94.0, 67.0, 44.0, 23.0, 27.0, 23.0, 18.0, 10.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 3.0], "bins": [-5.9375, -5.77178955078125, -5.6060791015625, -5.44036865234375, -5.274658203125, -5.10894775390625, -4.9432373046875, -4.77752685546875, -4.61181640625, -4.44610595703125, -4.2803955078125, -4.11468505859375, -3.948974609375, -3.78326416015625, -3.6175537109375, -3.45184326171875, -3.2861328125, -3.12042236328125, -2.9547119140625, -2.78900146484375, -2.623291015625, -2.45758056640625, -2.2918701171875, -2.12615966796875, -1.96044921875, -1.79473876953125, -1.6290283203125, -1.46331787109375, -1.297607421875, -1.13189697265625, -0.9661865234375, -0.80047607421875, -0.634765625, -0.46905517578125, -0.3033447265625, -0.13763427734375, 0.028076171875, 0.19378662109375, 0.3594970703125, 0.52520751953125, 0.69091796875, 0.85662841796875, 1.0223388671875, 1.18804931640625, 1.353759765625, 1.51947021484375, 1.6851806640625, 1.85089111328125, 2.0166015625, 2.18231201171875, 2.3480224609375, 2.51373291015625, 2.679443359375, 2.84515380859375, 3.0108642578125, 3.17657470703125, 3.34228515625, 3.50799560546875, 3.6737060546875, 3.83941650390625, 4.005126953125, 4.17083740234375, 4.3365478515625, 4.50225830078125, 4.66796875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 7.0, 4.0, 3.0, 11.0, 6.0, 15.0, 15.0, 23.0, 14.0, 36.0, 26.0, 50.0, 46.0, 39.0, 49.0, 52.0, 67.0, 57.0, 53.0, 63.0, 56.0, 50.0, 28.0, 42.0, 32.0, 33.0, 20.0, 13.0, 14.0, 18.0, 10.0, 11.0, 10.0, 12.0, 6.0, 5.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.38671875, -3.26556396484375, -3.1444091796875, -3.02325439453125, -2.902099609375, -2.78094482421875, -2.6597900390625, -2.53863525390625, -2.41748046875, -2.29632568359375, -2.1751708984375, -2.05401611328125, -1.932861328125, -1.81170654296875, -1.6905517578125, -1.56939697265625, -1.4482421875, -1.32708740234375, -1.2059326171875, -1.08477783203125, -0.963623046875, -0.84246826171875, -0.7213134765625, -0.60015869140625, -0.47900390625, -0.35784912109375, -0.2366943359375, -0.11553955078125, 0.005615234375, 0.12677001953125, 0.2479248046875, 0.36907958984375, 0.490234375, 0.61138916015625, 0.7325439453125, 0.85369873046875, 0.974853515625, 1.09600830078125, 1.2171630859375, 1.33831787109375, 1.45947265625, 1.58062744140625, 1.7017822265625, 1.82293701171875, 1.944091796875, 2.06524658203125, 2.1864013671875, 2.30755615234375, 2.4287109375, 2.54986572265625, 2.6710205078125, 2.79217529296875, 2.913330078125, 3.03448486328125, 3.1556396484375, 3.27679443359375, 3.39794921875, 3.51910400390625, 3.6402587890625, 3.76141357421875, 3.882568359375, 4.00372314453125, 4.1248779296875, 4.24603271484375, 4.3671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 8.0, 7.0, 1.0, 7.0, 6.0, 12.0, 15.0, 19.0, 15.0, 31.0, 40.0, 65.0, 95.0, 133.0, 183.0, 264.0, 416.0, 628.0, 1111.0, 2261.0, 6317.0, 28952.0, 623896.0, 346288.0, 26787.0, 5927.0, 2239.0, 993.0, 616.0, 409.0, 245.0, 165.0, 115.0, 77.0, 70.0, 42.0, 36.0, 13.0, 15.0, 14.0, 8.0, 7.0, 3.0, 4.0, 4.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.4296875, -11.072265625, -10.71484375, -10.357421875, -10.0, -9.642578125, -9.28515625, -8.927734375, -8.5703125, -8.212890625, -7.85546875, -7.498046875, -7.140625, -6.783203125, -6.42578125, -6.068359375, -5.7109375, -5.353515625, -4.99609375, -4.638671875, -4.28125, -3.923828125, -3.56640625, -3.208984375, -2.8515625, -2.494140625, -2.13671875, -1.779296875, -1.421875, -1.064453125, -0.70703125, -0.349609375, 0.0078125, 0.365234375, 0.72265625, 1.080078125, 1.4375, 1.794921875, 2.15234375, 2.509765625, 2.8671875, 3.224609375, 3.58203125, 3.939453125, 4.296875, 4.654296875, 5.01171875, 5.369140625, 5.7265625, 6.083984375, 6.44140625, 6.798828125, 7.15625, 7.513671875, 7.87109375, 8.228515625, 8.5859375, 8.943359375, 9.30078125, 9.658203125, 10.015625, 10.373046875, 10.73046875, 11.087890625, 11.4453125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 5.0, 5.0, 10.0, 12.0, 18.0, 15.0, 25.0, 30.0, 30.0, 30.0, 53.0, 54.0, 75.0, 72.0, 76.0, 75.0, 66.0, 65.0, 60.0, 35.0, 32.0, 36.0, 28.0, 18.0, 16.0, 19.0, 8.0, 11.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-18.421875, -17.9090576171875, -17.396240234375, -16.8834228515625, -16.37060546875, -15.8577880859375, -15.344970703125, -14.8321533203125, -14.3193359375, -13.8065185546875, -13.293701171875, -12.7808837890625, -12.26806640625, -11.7552490234375, -11.242431640625, -10.7296142578125, -10.216796875, -9.7039794921875, -9.191162109375, -8.6783447265625, -8.16552734375, -7.6527099609375, -7.139892578125, -6.6270751953125, -6.1142578125, -5.6014404296875, -5.088623046875, -4.5758056640625, -4.06298828125, -3.5501708984375, -3.037353515625, -2.5245361328125, -2.01171875, -1.4989013671875, -0.986083984375, -0.4732666015625, 0.03955078125, 0.5523681640625, 1.065185546875, 1.5780029296875, 2.0908203125, 2.6036376953125, 3.116455078125, 3.6292724609375, 4.14208984375, 4.6549072265625, 5.167724609375, 5.6805419921875, 6.193359375, 6.7061767578125, 7.218994140625, 7.7318115234375, 8.24462890625, 8.7574462890625, 9.270263671875, 9.7830810546875, 10.2958984375, 10.8087158203125, 11.321533203125, 11.8343505859375, 12.34716796875, 12.8599853515625, 13.372802734375, 13.8856201171875, 14.3984375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 6.0, 3.0, 6.0, 11.0, 18.0, 22.0, 25.0, 33.0, 45.0, 72.0, 87.0, 174.0, 270.0, 460.0, 790.0, 1583.0, 3650.0, 10856.0, 44205.0, 271772.0, 632048.0, 59926.0, 13845.0, 4561.0, 1869.0, 922.0, 506.0, 259.0, 186.0, 94.0, 77.0, 50.0, 29.0, 22.0, 21.0, 6.0, 17.0, 9.0, 5.0, 5.0, 2.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.51953125, -1.4706573486328125, -1.421783447265625, -1.3729095458984375, -1.32403564453125, -1.2751617431640625, -1.226287841796875, -1.1774139404296875, -1.1285400390625, -1.0796661376953125, -1.030792236328125, -0.9819183349609375, -0.93304443359375, -0.8841705322265625, -0.835296630859375, -0.7864227294921875, -0.737548828125, -0.6886749267578125, -0.639801025390625, -0.5909271240234375, -0.54205322265625, -0.4931793212890625, -0.444305419921875, -0.3954315185546875, -0.3465576171875, -0.2976837158203125, -0.248809814453125, -0.1999359130859375, -0.15106201171875, -0.1021881103515625, -0.053314208984375, -0.0044403076171875, 0.04443359375, 0.0933074951171875, 0.142181396484375, 0.1910552978515625, 0.23992919921875, 0.2888031005859375, 0.337677001953125, 0.3865509033203125, 0.4354248046875, 0.4842987060546875, 0.533172607421875, 0.5820465087890625, 0.63092041015625, 0.6797943115234375, 0.728668212890625, 0.7775421142578125, 0.826416015625, 0.8752899169921875, 0.924163818359375, 0.9730377197265625, 1.02191162109375, 1.0707855224609375, 1.119659423828125, 1.1685333251953125, 1.2174072265625, 1.2662811279296875, 1.315155029296875, 1.3640289306640625, 1.41290283203125, 1.4617767333984375, 1.510650634765625, 1.5595245361328125, 1.6083984375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 4.0, 6.0, 8.0, 9.0, 11.0, 9.0, 11.0, 15.0, 24.0, 23.0, 47.0, 45.0, 71.0, 94.0, 105.0, 85.0, 87.0, 75.0, 67.0, 43.0, 28.0, 21.0, 21.0, 15.0, 12.0, 9.0, 11.0, 8.0, 7.0, 4.0, 2.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00039958953857421875, -0.00038382411003112793, -0.0003680586814880371, -0.0003522932529449463, -0.00033652782440185547, -0.00032076239585876465, -0.00030499696731567383, -0.000289231538772583, -0.0002734661102294922, -0.00025770068168640137, -0.00024193525314331055, -0.00022616982460021973, -0.0002104043960571289, -0.00019463896751403809, -0.00017887353897094727, -0.00016310811042785645, -0.00014734268188476562, -0.0001315772533416748, -0.00011581182479858398, -0.00010004639625549316, -8.428096771240234e-05, -6.851553916931152e-05, -5.27501106262207e-05, -3.698468208312988e-05, -2.1219253540039062e-05, -5.453824996948242e-06, 1.0311603546142578e-05, 2.60770320892334e-05, 4.184246063232422e-05, 5.760788917541504e-05, 7.337331771850586e-05, 8.913874626159668e-05, 0.0001049041748046875, 0.00012066960334777832, 0.00013643503189086914, 0.00015220046043395996, 0.00016796588897705078, 0.0001837313175201416, 0.00019949674606323242, 0.00021526217460632324, 0.00023102760314941406, 0.0002467930316925049, 0.0002625584602355957, 0.0002783238887786865, 0.00029408931732177734, 0.00030985474586486816, 0.000325620174407959, 0.0003413856029510498, 0.0003571510314941406, 0.00037291646003723145, 0.00038868188858032227, 0.0004044473171234131, 0.0004202127456665039, 0.0004359781742095947, 0.00045174360275268555, 0.00046750903129577637, 0.0004832744598388672, 0.000499039888381958, 0.0005148053169250488, 0.0005305707454681396, 0.0005463361740112305, 0.0005621016025543213, 0.0005778670310974121, 0.0005936324596405029, 0.0006093978881835938]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 6.0, 6.0, 6.0, 12.0, 14.0, 12.0, 26.0, 28.0, 30.0, 41.0, 66.0, 80.0, 111.0, 167.0, 236.0, 387.0, 668.0, 1203.0, 2442.0, 6327.0, 23470.0, 134592.0, 728724.0, 117556.0, 21149.0, 5822.0, 2334.0, 1171.0, 622.0, 360.0, 280.0, 169.0, 107.0, 74.0, 69.0, 39.0, 25.0, 24.0, 25.0, 15.0, 15.0, 10.0, 9.0, 7.0, 6.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.376953125, -1.33319091796875, -1.2894287109375, -1.24566650390625, -1.201904296875, -1.15814208984375, -1.1143798828125, -1.07061767578125, -1.02685546875, -0.98309326171875, -0.9393310546875, -0.89556884765625, -0.851806640625, -0.80804443359375, -0.7642822265625, -0.72052001953125, -0.6767578125, -0.63299560546875, -0.5892333984375, -0.54547119140625, -0.501708984375, -0.45794677734375, -0.4141845703125, -0.37042236328125, -0.32666015625, -0.28289794921875, -0.2391357421875, -0.19537353515625, -0.151611328125, -0.10784912109375, -0.0640869140625, -0.02032470703125, 0.0234375, 0.06719970703125, 0.1109619140625, 0.15472412109375, 0.198486328125, 0.24224853515625, 0.2860107421875, 0.32977294921875, 0.37353515625, 0.41729736328125, 0.4610595703125, 0.50482177734375, 0.548583984375, 0.59234619140625, 0.6361083984375, 0.67987060546875, 0.7236328125, 0.76739501953125, 0.8111572265625, 0.85491943359375, 0.898681640625, 0.94244384765625, 0.9862060546875, 1.02996826171875, 1.07373046875, 1.11749267578125, 1.1612548828125, 1.20501708984375, 1.248779296875, 1.29254150390625, 1.3363037109375, 1.38006591796875, 1.423828125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 3.0, 7.0, 9.0, 10.0, 11.0, 23.0, 31.0, 44.0, 46.0, 60.0, 80.0, 104.0, 82.0, 103.0, 90.0, 64.0, 58.0, 46.0, 40.0, 14.0, 19.0, 22.0, 6.0, 8.0, 5.0, 8.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5986328125, -1.5409088134765625, -1.483184814453125, -1.4254608154296875, -1.36773681640625, -1.3100128173828125, -1.252288818359375, -1.1945648193359375, -1.1368408203125, -1.0791168212890625, -1.021392822265625, -0.9636688232421875, -0.90594482421875, -0.8482208251953125, -0.790496826171875, -0.7327728271484375, -0.675048828125, -0.6173248291015625, -0.559600830078125, -0.5018768310546875, -0.44415283203125, -0.3864288330078125, -0.328704833984375, -0.2709808349609375, -0.2132568359375, -0.1555328369140625, -0.097808837890625, -0.0400848388671875, 0.01763916015625, 0.0753631591796875, 0.133087158203125, 0.1908111572265625, 0.24853515625, 0.3062591552734375, 0.363983154296875, 0.4217071533203125, 0.47943115234375, 0.5371551513671875, 0.594879150390625, 0.6526031494140625, 0.7103271484375, 0.7680511474609375, 0.825775146484375, 0.8834991455078125, 0.94122314453125, 0.9989471435546875, 1.056671142578125, 1.1143951416015625, 1.172119140625, 1.2298431396484375, 1.287567138671875, 1.3452911376953125, 1.40301513671875, 1.4607391357421875, 1.518463134765625, 1.5761871337890625, 1.6339111328125, 1.6916351318359375, 1.749359130859375, 1.8070831298828125, 1.86480712890625, 1.9225311279296875, 1.980255126953125, 2.0379791259765625, 2.095703125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 7.0, 6.0, 4.0, 4.0, 9.0, 10.0, 21.0, 17.0, 40.0, 44.0, 48.0, 56.0, 57.0, 100.0, 245.0, 98.0, 64.0, 53.0, 33.0, 19.0, 12.0, 9.0, 9.0, 7.0, 7.0, 8.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-37.40925598144531, -36.5287971496582, -35.648338317871094, -34.767879486083984, -33.887420654296875, -33.006961822509766, -32.126502990722656, -31.246044158935547, -30.365585327148438, -29.485126495361328, -28.60466766357422, -27.72420883178711, -26.84375, -25.96329116821289, -25.08283233642578, -24.202373504638672, -23.321914672851562, -22.441455841064453, -21.560997009277344, -20.680538177490234, -19.800079345703125, -18.919620513916016, -18.039161682128906, -17.158702850341797, -16.278244018554688, -15.397785186767578, -14.517326354980469, -13.63686752319336, -12.75640869140625, -11.87594985961914, -10.995491027832031, -10.115032196044922, -9.23457145690918, -8.35411262512207, -7.473653793334961, -6.593194961547852, -5.712736129760742, -4.832277297973633, -3.9518184661865234, -3.071359634399414, -2.1909008026123047, -1.3104419708251953, -0.42998313903808594, 0.45047569274902344, 1.3309345245361328, 2.211393356323242, 3.0918521881103516, 3.972311019897461, 4.85276985168457, 5.73322868347168, 6.613687515258789, 7.494146347045898, 8.374605178833008, 9.255064010620117, 10.135522842407227, 11.015981674194336, 11.896440505981445, 12.776899337768555, 13.657358169555664, 14.537817001342773, 15.418275833129883, 16.298734664916992, 17.1791934967041, 18.05965232849121, 18.94011116027832]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 6.0, 3.0, 2.0, 6.0, 6.0, 14.0, 11.0, 19.0, 23.0, 15.0, 17.0, 22.0, 26.0, 23.0, 22.0, 25.0, 25.0, 34.0, 51.0, 87.0, 145.0, 91.0, 50.0, 47.0, 35.0, 21.0, 23.0, 14.0, 15.0, 18.0, 18.0, 11.0, 13.0, 11.0, 13.0, 7.0, 5.0, 2.0, 7.0, 4.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-43.098724365234375, -41.73188018798828, -40.36503601074219, -38.998191833496094, -37.631343841552734, -36.26449966430664, -34.89765548706055, -33.53081130981445, -32.16396713256836, -30.797122955322266, -29.43027687072754, -28.063432693481445, -26.69658851623535, -25.329742431640625, -23.96289825439453, -22.596054077148438, -21.22920799255371, -19.862363815307617, -18.49551773071289, -17.128673553466797, -15.761829376220703, -14.394984245300293, -13.028139114379883, -11.661294937133789, -10.294449806213379, -8.927604675292969, -7.560760498046875, -6.193915367126465, -4.827070713043213, -3.460226058959961, -2.093380928039551, -0.726536750793457, 0.6403083801269531, 2.007153034210205, 3.373997926712036, 4.740842819213867, 6.107687473297119, 7.474532127380371, 8.841377258300781, 10.208221435546875, 11.575066566467285, 12.941911697387695, 14.308755874633789, 15.6756010055542, 17.04244613647461, 18.409290313720703, 19.776134490966797, 21.14297866821289, 22.509824752807617, 23.87666893005371, 25.243515014648438, 26.61035919189453, 27.977203369140625, 29.34404754638672, 30.710893630981445, 32.077735900878906, 33.444583892822266, 34.81142807006836, 36.17827224731445, 37.54512023925781, 38.911964416503906, 40.27880859375, 41.645652770996094, 43.01249694824219, 44.37934112548828]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 4.0, 12.0, 15.0, 20.0, 37.0, 56.0, 56.0, 108.0, 145.0, 230.0, 394.0, 621.0, 1068.0, 1814.0, 3373.0, 7327.0, 18993.0, 74555.0, 331317.0, 1274421.0, 1804285.0, 520638.0, 111543.0, 26082.0, 7991.0, 3820.0, 2028.0, 1202.0, 719.0, 453.0, 315.0, 184.0, 136.0, 93.0, 63.0, 53.0, 28.0, 27.0, 20.0, 6.0, 11.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.54296875, -3.4171142578125, -3.291259765625, -3.1654052734375, -3.03955078125, -2.9136962890625, -2.787841796875, -2.6619873046875, -2.5361328125, -2.4102783203125, -2.284423828125, -2.1585693359375, -2.03271484375, -1.9068603515625, -1.781005859375, -1.6551513671875, -1.529296875, -1.4034423828125, -1.277587890625, -1.1517333984375, -1.02587890625, -0.9000244140625, -0.774169921875, -0.6483154296875, -0.5224609375, -0.3966064453125, -0.270751953125, -0.1448974609375, -0.01904296875, 0.1068115234375, 0.232666015625, 0.3585205078125, 0.484375, 0.6102294921875, 0.736083984375, 0.8619384765625, 0.98779296875, 1.1136474609375, 1.239501953125, 1.3653564453125, 1.4912109375, 1.6170654296875, 1.742919921875, 1.8687744140625, 1.99462890625, 2.1204833984375, 2.246337890625, 2.3721923828125, 2.498046875, 2.6239013671875, 2.749755859375, 2.8756103515625, 3.00146484375, 3.1273193359375, 3.253173828125, 3.3790283203125, 3.5048828125, 3.6307373046875, 3.756591796875, 3.8824462890625, 4.00830078125, 4.1341552734375, 4.260009765625, 4.3858642578125, 4.51171875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 2.0, 12.0, 7.0, 13.0, 14.0, 20.0, 23.0, 15.0, 16.0, 29.0, 29.0, 36.0, 45.0, 55.0, 64.0, 58.0, 60.0, 55.0, 61.0, 57.0, 42.0, 39.0, 29.0, 38.0, 29.0, 28.0, 21.0, 14.0, 14.0, 22.0, 8.0, 6.0, 11.0, 6.0, 5.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.03125, -2.9154052734375, -2.799560546875, -2.6837158203125, -2.56787109375, -2.4520263671875, -2.336181640625, -2.2203369140625, -2.1044921875, -1.9886474609375, -1.872802734375, -1.7569580078125, -1.64111328125, -1.5252685546875, -1.409423828125, -1.2935791015625, -1.177734375, -1.0618896484375, -0.946044921875, -0.8302001953125, -0.71435546875, -0.5985107421875, -0.482666015625, -0.3668212890625, -0.2509765625, -0.1351318359375, -0.019287109375, 0.0965576171875, 0.21240234375, 0.3282470703125, 0.444091796875, 0.5599365234375, 0.67578125, 0.7916259765625, 0.907470703125, 1.0233154296875, 1.13916015625, 1.2550048828125, 1.370849609375, 1.4866943359375, 1.6025390625, 1.7183837890625, 1.834228515625, 1.9500732421875, 2.06591796875, 2.1817626953125, 2.297607421875, 2.4134521484375, 2.529296875, 2.6451416015625, 2.760986328125, 2.8768310546875, 2.99267578125, 3.1085205078125, 3.224365234375, 3.3402099609375, 3.4560546875, 3.5718994140625, 3.687744140625, 3.8035888671875, 3.91943359375, 4.0352783203125, 4.151123046875, 4.2669677734375, 4.3828125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 9.0, 3.0, 5.0, 16.0, 23.0, 31.0, 37.0, 57.0, 80.0, 179.0, 246.0, 514.0, 1200.0, 4260.0, 47310.0, 4024777.0, 106480.0, 6042.0, 1576.0, 606.0, 322.0, 172.0, 110.0, 70.0, 51.0, 36.0, 19.0, 15.0, 11.0, 9.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.03125, -16.5242919921875, -16.017333984375, -15.5103759765625, -15.00341796875, -14.4964599609375, -13.989501953125, -13.4825439453125, -12.9755859375, -12.4686279296875, -11.961669921875, -11.4547119140625, -10.94775390625, -10.4407958984375, -9.933837890625, -9.4268798828125, -8.919921875, -8.4129638671875, -7.906005859375, -7.3990478515625, -6.89208984375, -6.3851318359375, -5.878173828125, -5.3712158203125, -4.8642578125, -4.3572998046875, -3.850341796875, -3.3433837890625, -2.83642578125, -2.3294677734375, -1.822509765625, -1.3155517578125, -0.80859375, -0.3016357421875, 0.205322265625, 0.7122802734375, 1.21923828125, 1.7261962890625, 2.233154296875, 2.7401123046875, 3.2470703125, 3.7540283203125, 4.260986328125, 4.7679443359375, 5.27490234375, 5.7818603515625, 6.288818359375, 6.7957763671875, 7.302734375, 7.8096923828125, 8.316650390625, 8.8236083984375, 9.33056640625, 9.8375244140625, 10.344482421875, 10.8514404296875, 11.3583984375, 11.8653564453125, 12.372314453125, 12.8792724609375, 13.38623046875, 13.8931884765625, 14.400146484375, 14.9071044921875, 15.4140625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 6.0, 11.0, 10.0, 15.0, 24.0, 35.0, 50.0, 69.0, 86.0, 152.0, 207.0, 305.0, 543.0, 726.0, 583.0, 421.0, 256.0, 189.0, 106.0, 88.0, 51.0, 32.0, 31.0, 24.0, 15.0, 14.0, 8.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.88671875, -7.59185791015625, -7.2969970703125, -7.00213623046875, -6.707275390625, -6.41241455078125, -6.1175537109375, -5.82269287109375, -5.52783203125, -5.23297119140625, -4.9381103515625, -4.64324951171875, -4.348388671875, -4.05352783203125, -3.7586669921875, -3.46380615234375, -3.1689453125, -2.87408447265625, -2.5792236328125, -2.28436279296875, -1.989501953125, -1.69464111328125, -1.3997802734375, -1.10491943359375, -0.81005859375, -0.51519775390625, -0.2203369140625, 0.07452392578125, 0.369384765625, 0.66424560546875, 0.9591064453125, 1.25396728515625, 1.548828125, 1.84368896484375, 2.1385498046875, 2.43341064453125, 2.728271484375, 3.02313232421875, 3.3179931640625, 3.61285400390625, 3.90771484375, 4.20257568359375, 4.4974365234375, 4.79229736328125, 5.087158203125, 5.38201904296875, 5.6768798828125, 5.97174072265625, 6.2666015625, 6.56146240234375, 6.8563232421875, 7.15118408203125, 7.446044921875, 7.74090576171875, 8.0357666015625, 8.33062744140625, 8.62548828125, 8.92034912109375, 9.2152099609375, 9.51007080078125, 9.804931640625, 10.09979248046875, 10.3946533203125, 10.68951416015625, 10.984375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 9.0, 5.0, 14.0, 39.0, 94.0, 164.0, 318.0, 185.0, 98.0, 41.0, 15.0, 11.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.60685729980469, -51.511802673339844, -47.416744232177734, -43.321685791015625, -39.22663116455078, -35.13157653808594, -31.036518096923828, -26.94146156311035, -22.846405029296875, -18.7513484954834, -14.656291961669922, -10.561235427856445, -6.466178894042969, -2.371122360229492, 1.7239341735839844, 5.818990707397461, 9.914047241210938, 14.009103775024414, 18.10416030883789, 22.199216842651367, 26.294273376464844, 30.38932991027832, 34.4843864440918, 38.579444885253906, 42.67449951171875, 46.769554138183594, 50.8646125793457, 54.95967102050781, 59.054725646972656, 63.1497802734375, 67.24484252929688, 71.33989715576172, 75.43496704101562, 79.53002166748047, 83.62507629394531, 87.72013854980469, 91.81519317626953, 95.91024780273438, 100.00531005859375, 104.1003646850586, 108.19541931152344, 112.29047393798828, 116.38552856445312, 120.4805908203125, 124.57564544677734, 128.6707000732422, 132.76576232910156, 136.86080932617188, 140.95587158203125, 145.05093383789062, 149.14598083496094, 153.2410430908203, 157.33609008789062, 161.43115234375, 165.52621459960938, 169.6212615966797, 173.71632385253906, 177.81138610839844, 181.90643310546875, 186.00149536132812, 190.0965576171875, 194.1916046142578, 198.2866668701172, 202.3817138671875, 206.47677612304688]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 14.0, 13.0, 15.0, 9.0, 18.0, 27.0, 24.0, 23.0, 33.0, 41.0, 37.0, 48.0, 39.0, 54.0, 50.0, 74.0, 64.0, 55.0, 39.0, 46.0, 36.0, 44.0, 26.0, 27.0, 21.0, 28.0, 15.0, 20.0, 16.0, 10.0, 4.0, 6.0, 4.0, 4.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.10715103149414, -45.554622650146484, -44.00209426879883, -42.44956588745117, -40.89703369140625, -39.344505310058594, -37.79197692871094, -36.23944854736328, -34.686920166015625, -33.13439178466797, -31.581863403320312, -30.029333114624023, -28.476804733276367, -26.92427635192871, -25.371746063232422, -23.819217681884766, -22.26668930053711, -20.714160919189453, -19.161632537841797, -17.609102249145508, -16.05657386779785, -14.504045486450195, -12.951516151428223, -11.39898681640625, -9.846458435058594, -8.293930053710938, -6.741400718688965, -5.18887186050415, -3.636343002319336, -2.0838141441345215, -0.531285285949707, 1.0212440490722656, 2.5737762451171875, 4.126305103302002, 5.678833961486816, 7.231362819671631, 8.783891677856445, 10.336420059204102, 11.888949394226074, 13.441478729248047, 14.994007110595703, 16.54653549194336, 18.099063873291016, 19.651594161987305, 21.20412254333496, 22.756650924682617, 24.309181213378906, 25.861709594726562, 27.41423797607422, 28.966766357421875, 30.51929473876953, 32.07182312011719, 33.624351501464844, 35.176883697509766, 36.72941207885742, 38.28194046020508, 39.834468841552734, 41.38699722290039, 42.93952560424805, 44.4920539855957, 46.044586181640625, 47.59711456298828, 49.14964294433594, 50.702171325683594, 52.25469970703125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 15.0, 16.0, 29.0, 48.0, 64.0, 146.0, 288.0, 638.0, 1539.0, 4343.0, 15419.0, 79769.0, 736363.0, 173266.0, 25981.0, 6698.0, 2203.0, 864.0, 401.0, 209.0, 96.0, 62.0, 38.0, 24.0, 9.0, 5.0, 7.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.18359375, -5.91094970703125, -5.6383056640625, -5.36566162109375, -5.093017578125, -4.82037353515625, -4.5477294921875, -4.27508544921875, -4.00244140625, -3.72979736328125, -3.4571533203125, -3.18450927734375, -2.911865234375, -2.63922119140625, -2.3665771484375, -2.09393310546875, -1.8212890625, -1.54864501953125, -1.2760009765625, -1.00335693359375, -0.730712890625, -0.45806884765625, -0.1854248046875, 0.08721923828125, 0.35986328125, 0.63250732421875, 0.9051513671875, 1.17779541015625, 1.450439453125, 1.72308349609375, 1.9957275390625, 2.26837158203125, 2.541015625, 2.81365966796875, 3.0863037109375, 3.35894775390625, 3.631591796875, 3.90423583984375, 4.1768798828125, 4.44952392578125, 4.72216796875, 4.99481201171875, 5.2674560546875, 5.54010009765625, 5.812744140625, 6.08538818359375, 6.3580322265625, 6.63067626953125, 6.9033203125, 7.17596435546875, 7.4486083984375, 7.72125244140625, 7.993896484375, 8.26654052734375, 8.5391845703125, 8.81182861328125, 9.08447265625, 9.35711669921875, 9.6297607421875, 9.90240478515625, 10.175048828125, 10.44769287109375, 10.7203369140625, 10.99298095703125, 11.265625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 0.0, 4.0, 1.0, 7.0, 4.0, 3.0, 8.0, 11.0, 12.0, 17.0, 16.0, 33.0, 31.0, 35.0, 42.0, 49.0, 52.0, 48.0, 56.0, 64.0, 65.0, 56.0, 39.0, 48.0, 37.0, 46.0, 32.0, 39.0, 24.0, 28.0, 21.0, 16.0, 10.0, 8.0, 8.0, 8.0, 8.0, 3.0, 1.0, 6.0, 1.0, 1.0, 6.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.759765625, -3.636871337890625, -3.51397705078125, -3.391082763671875, -3.2681884765625, -3.145294189453125, -3.02239990234375, -2.899505615234375, -2.776611328125, -2.653717041015625, -2.53082275390625, -2.407928466796875, -2.2850341796875, -2.162139892578125, -2.03924560546875, -1.916351318359375, -1.79345703125, -1.670562744140625, -1.54766845703125, -1.424774169921875, -1.3018798828125, -1.178985595703125, -1.05609130859375, -0.933197021484375, -0.810302734375, -0.687408447265625, -0.56451416015625, -0.441619873046875, -0.3187255859375, -0.195831298828125, -0.07293701171875, 0.049957275390625, 0.1728515625, 0.295745849609375, 0.41864013671875, 0.541534423828125, 0.6644287109375, 0.787322998046875, 0.91021728515625, 1.033111572265625, 1.156005859375, 1.278900146484375, 1.40179443359375, 1.524688720703125, 1.6475830078125, 1.770477294921875, 1.89337158203125, 2.016265869140625, 2.13916015625, 2.262054443359375, 2.38494873046875, 2.507843017578125, 2.6307373046875, 2.753631591796875, 2.87652587890625, 2.999420166015625, 3.122314453125, 3.245208740234375, 3.36810302734375, 3.490997314453125, 3.6138916015625, 3.736785888671875, 3.85968017578125, 3.982574462890625, 4.10546875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 11.0, 8.0, 8.0, 22.0, 27.0, 32.0, 57.0, 88.0, 117.0, 175.0, 255.0, 456.0, 859.0, 1883.0, 5532.0, 24721.0, 797209.0, 190623.0, 18435.0, 4488.0, 1664.0, 757.0, 387.0, 228.0, 147.0, 96.0, 74.0, 54.0, 32.0, 28.0, 11.0, 17.0, 18.0, 8.0, 7.0, 3.0, 2.0, 4.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.0703125, -8.7861328125, -8.501953125, -8.2177734375, -7.93359375, -7.6494140625, -7.365234375, -7.0810546875, -6.796875, -6.5126953125, -6.228515625, -5.9443359375, -5.66015625, -5.3759765625, -5.091796875, -4.8076171875, -4.5234375, -4.2392578125, -3.955078125, -3.6708984375, -3.38671875, -3.1025390625, -2.818359375, -2.5341796875, -2.25, -1.9658203125, -1.681640625, -1.3974609375, -1.11328125, -0.8291015625, -0.544921875, -0.2607421875, 0.0234375, 0.3076171875, 0.591796875, 0.8759765625, 1.16015625, 1.4443359375, 1.728515625, 2.0126953125, 2.296875, 2.5810546875, 2.865234375, 3.1494140625, 3.43359375, 3.7177734375, 4.001953125, 4.2861328125, 4.5703125, 4.8544921875, 5.138671875, 5.4228515625, 5.70703125, 5.9912109375, 6.275390625, 6.5595703125, 6.84375, 7.1279296875, 7.412109375, 7.6962890625, 7.98046875, 8.2646484375, 8.548828125, 8.8330078125, 9.1171875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 6.0, 5.0, 8.0, 10.0, 9.0, 7.0, 6.0, 11.0, 28.0, 21.0, 18.0, 38.0, 31.0, 32.0, 61.0, 57.0, 82.0, 78.0, 71.0, 87.0, 60.0, 57.0, 35.0, 25.0, 26.0, 23.0, 16.0, 23.0, 16.0, 9.0, 7.0, 9.0, 6.0, 9.0, 1.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.21875, -15.711181640625, -15.20361328125, -14.696044921875, -14.1884765625, -13.680908203125, -13.17333984375, -12.665771484375, -12.158203125, -11.650634765625, -11.14306640625, -10.635498046875, -10.1279296875, -9.620361328125, -9.11279296875, -8.605224609375, -8.09765625, -7.590087890625, -7.08251953125, -6.574951171875, -6.0673828125, -5.559814453125, -5.05224609375, -4.544677734375, -4.037109375, -3.529541015625, -3.02197265625, -2.514404296875, -2.0068359375, -1.499267578125, -0.99169921875, -0.484130859375, 0.0234375, 0.531005859375, 1.03857421875, 1.546142578125, 2.0537109375, 2.561279296875, 3.06884765625, 3.576416015625, 4.083984375, 4.591552734375, 5.09912109375, 5.606689453125, 6.1142578125, 6.621826171875, 7.12939453125, 7.636962890625, 8.14453125, 8.652099609375, 9.15966796875, 9.667236328125, 10.1748046875, 10.682373046875, 11.18994140625, 11.697509765625, 12.205078125, 12.712646484375, 13.22021484375, 13.727783203125, 14.2353515625, 14.742919921875, 15.25048828125, 15.758056640625, 16.265625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 2.0, 7.0, 4.0, 8.0, 20.0, 20.0, 32.0, 35.0, 68.0, 119.0, 309.0, 864.0, 3189.0, 20390.0, 901895.0, 110172.0, 8674.0, 1710.0, 521.0, 214.0, 103.0, 63.0, 36.0, 29.0, 20.0, 17.0, 7.0, 3.0, 6.0, 4.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.744140625, -2.66046142578125, -2.5767822265625, -2.49310302734375, -2.409423828125, -2.32574462890625, -2.2420654296875, -2.15838623046875, -2.07470703125, -1.99102783203125, -1.9073486328125, -1.82366943359375, -1.739990234375, -1.65631103515625, -1.5726318359375, -1.48895263671875, -1.4052734375, -1.32159423828125, -1.2379150390625, -1.15423583984375, -1.070556640625, -0.98687744140625, -0.9031982421875, -0.81951904296875, -0.73583984375, -0.65216064453125, -0.5684814453125, -0.48480224609375, -0.401123046875, -0.31744384765625, -0.2337646484375, -0.15008544921875, -0.06640625, 0.01727294921875, 0.1009521484375, 0.18463134765625, 0.268310546875, 0.35198974609375, 0.4356689453125, 0.51934814453125, 0.60302734375, 0.68670654296875, 0.7703857421875, 0.85406494140625, 0.937744140625, 1.02142333984375, 1.1051025390625, 1.18878173828125, 1.2724609375, 1.35614013671875, 1.4398193359375, 1.52349853515625, 1.607177734375, 1.69085693359375, 1.7745361328125, 1.85821533203125, 1.94189453125, 2.02557373046875, 2.1092529296875, 2.19293212890625, 2.276611328125, 2.36029052734375, 2.4439697265625, 2.52764892578125, 2.611328125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 5.0, 3.0, 5.0, 8.0, 5.0, 12.0, 11.0, 10.0, 18.0, 22.0, 44.0, 44.0, 79.0, 104.0, 129.0, 136.0, 103.0, 66.0, 46.0, 29.0, 23.0, 24.0, 20.0, 9.0, 10.0, 6.0, 7.0, 7.0, 5.0, 3.0, 5.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00034880638122558594, -0.0003336481750011444, -0.0003184899687767029, -0.00030333176255226135, -0.0002881735563278198, -0.0002730153501033783, -0.00025785714387893677, -0.00024269893765449524, -0.0002275407314300537, -0.00021238252520561218, -0.00019722431898117065, -0.00018206611275672913, -0.0001669079065322876, -0.00015174970030784607, -0.00013659149408340454, -0.00012143328785896301, -0.00010627508163452148, -9.111687541007996e-05, -7.595866918563843e-05, -6.08004629611969e-05, -4.564225673675537e-05, -3.0484050512313843e-05, -1.5325844287872314e-05, -1.6763806343078613e-07, 1.4990568161010742e-05, 3.014877438545227e-05, 4.53069806098938e-05, 6.046518683433533e-05, 7.562339305877686e-05, 9.078159928321838e-05, 0.00010593980550765991, 0.00012109801173210144, 0.00013625621795654297, 0.0001514144241809845, 0.00016657263040542603, 0.00018173083662986755, 0.00019688904285430908, 0.0002120472490787506, 0.00022720545530319214, 0.00024236366152763367, 0.0002575218677520752, 0.0002726800739765167, 0.00028783828020095825, 0.0003029964864253998, 0.0003181546926498413, 0.00033331289887428284, 0.00034847110509872437, 0.0003636293113231659, 0.0003787875175476074, 0.00039394572377204895, 0.0004091039299964905, 0.000424262136220932, 0.00043942034244537354, 0.00045457854866981506, 0.0004697367548942566, 0.0004848949611186981, 0.0005000531673431396, 0.0005152113735675812, 0.0005303695797920227, 0.0005455277860164642, 0.0005606859922409058, 0.0005758441984653473, 0.0005910024046897888, 0.0006061606109142303, 0.0006213188171386719]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 5.0, 1.0, 4.0, 4.0, 5.0, 11.0, 7.0, 13.0, 12.0, 23.0, 41.0, 51.0, 82.0, 95.0, 118.0, 184.0, 307.0, 503.0, 777.0, 1389.0, 3056.0, 7645.0, 22502.0, 92795.0, 792550.0, 89881.0, 21996.0, 7654.0, 3099.0, 1453.0, 760.0, 504.0, 328.0, 205.0, 126.0, 94.0, 73.0, 54.0, 49.0, 26.0, 29.0, 11.0, 8.0, 8.0, 8.0, 4.0, 2.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74951171875, -0.72320556640625, -0.6968994140625, -0.67059326171875, -0.644287109375, -0.61798095703125, -0.5916748046875, -0.56536865234375, -0.5390625, -0.51275634765625, -0.4864501953125, -0.46014404296875, -0.433837890625, -0.40753173828125, -0.3812255859375, -0.35491943359375, -0.32861328125, -0.30230712890625, -0.2760009765625, -0.24969482421875, -0.223388671875, -0.19708251953125, -0.1707763671875, -0.14447021484375, -0.1181640625, -0.09185791015625, -0.0655517578125, -0.03924560546875, -0.012939453125, 0.01336669921875, 0.0396728515625, 0.06597900390625, 0.09228515625, 0.11859130859375, 0.1448974609375, 0.17120361328125, 0.197509765625, 0.22381591796875, 0.2501220703125, 0.27642822265625, 0.302734375, 0.32904052734375, 0.3553466796875, 0.38165283203125, 0.407958984375, 0.43426513671875, 0.4605712890625, 0.48687744140625, 0.51318359375, 0.53948974609375, 0.5657958984375, 0.59210205078125, 0.618408203125, 0.64471435546875, 0.6710205078125, 0.69732666015625, 0.7236328125, 0.74993896484375, 0.7762451171875, 0.80255126953125, 0.828857421875, 0.85516357421875, 0.8814697265625, 0.90777587890625, 0.93408203125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 8.0, 8.0, 8.0, 4.0, 7.0, 9.0, 9.0, 17.0, 22.0, 27.0, 22.0, 32.0, 54.0, 49.0, 64.0, 65.0, 77.0, 84.0, 77.0, 73.0, 63.0, 42.0, 31.0, 43.0, 16.0, 20.0, 10.0, 7.0, 9.0, 10.0, 9.0, 7.0, 8.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.1044921875, -1.0643310546875, -1.024169921875, -0.9840087890625, -0.94384765625, -0.9036865234375, -0.863525390625, -0.8233642578125, -0.783203125, -0.7430419921875, -0.702880859375, -0.6627197265625, -0.62255859375, -0.5823974609375, -0.542236328125, -0.5020751953125, -0.4619140625, -0.4217529296875, -0.381591796875, -0.3414306640625, -0.30126953125, -0.2611083984375, -0.220947265625, -0.1807861328125, -0.140625, -0.1004638671875, -0.060302734375, -0.0201416015625, 0.02001953125, 0.0601806640625, 0.100341796875, 0.1405029296875, 0.1806640625, 0.2208251953125, 0.260986328125, 0.3011474609375, 0.34130859375, 0.3814697265625, 0.421630859375, 0.4617919921875, 0.501953125, 0.5421142578125, 0.582275390625, 0.6224365234375, 0.66259765625, 0.7027587890625, 0.742919921875, 0.7830810546875, 0.8232421875, 0.8634033203125, 0.903564453125, 0.9437255859375, 0.98388671875, 1.0240478515625, 1.064208984375, 1.1043701171875, 1.14453125, 1.1846923828125, 1.224853515625, 1.2650146484375, 1.30517578125, 1.3453369140625, 1.385498046875, 1.4256591796875, 1.4658203125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 19.0, 49.0, 431.0, 368.0, 72.0, 31.0, 19.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.9377326965332, -53.136802673339844, -49.335872650146484, -45.534942626953125, -41.734012603759766, -37.933082580566406, -34.13215637207031, -30.33122444152832, -26.53029441833496, -22.7293643951416, -18.928434371948242, -15.1275053024292, -11.32657527923584, -7.525646209716797, -3.7247161865234375, 0.07621383666992188, 3.8771438598632812, 7.678073883056641, 11.47900390625, 15.279932975769043, 19.08086395263672, 22.881792068481445, 26.682722091674805, 30.483652114868164, 34.284584045410156, 38.085514068603516, 41.886444091796875, 45.687374114990234, 49.488304138183594, 53.28923034667969, 57.09016418457031, 60.891090393066406, 64.69202423095703, 68.49295043945312, 72.29388427734375, 76.09481048583984, 79.89574432373047, 83.69667053222656, 87.49760437011719, 91.29853057861328, 95.0994644165039, 98.900390625, 102.70132446289062, 106.50225067138672, 110.30318450927734, 114.10411071777344, 117.90504455566406, 121.70597076416016, 125.50689697265625, 129.30783081054688, 133.10874938964844, 136.90968322753906, 140.7106170654297, 144.5115509033203, 148.31246948242188, 152.1134033203125, 155.91433715820312, 159.71527099609375, 163.5161895751953, 167.31712341308594, 171.11805725097656, 174.9189910888672, 178.71990966796875, 182.52084350585938, 186.32177734375]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 4.0, 5.0, 6.0, 6.0, 5.0, 20.0, 11.0, 23.0, 19.0, 20.0, 30.0, 28.0, 39.0, 54.0, 373.0, 125.0, 24.0, 43.0, 29.0, 22.0, 22.0, 17.0, 14.0, 9.0, 10.0, 10.0, 17.0, 2.0, 6.0, 4.0, 3.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.476261138916016, -41.784732818603516, -40.093204498291016, -38.401676177978516, -36.710147857666016, -35.018619537353516, -33.32709503173828, -31.63556480407715, -29.94403648376465, -28.25250816345215, -26.56097984313965, -24.86945343017578, -23.17792510986328, -21.48639678955078, -19.79486846923828, -18.10334014892578, -16.41181182861328, -14.720283508300781, -13.028755187988281, -11.337227821350098, -9.645699501037598, -7.954171180725098, -6.262643814086914, -4.571115493774414, -2.879587173461914, -1.1880590915679932, 0.5034689903259277, 2.1949968338012695, 3.8865251541137695, 5.5780534744262695, 7.269580841064453, 8.961109161376953, 10.652641296386719, 12.344169616699219, 14.035697937011719, 15.727225303649902, 17.41875457763672, 19.11028289794922, 20.801809310913086, 22.493337631225586, 24.184865951538086, 25.876394271850586, 27.567922592163086, 29.259449005126953, 30.950977325439453, 32.64250564575195, 34.33403396606445, 36.02556228637695, 37.71709060668945, 39.40861892700195, 41.10014724731445, 42.79167556762695, 44.48320388793945, 46.17473220825195, 47.86625671386719, 49.55778503417969, 51.24931335449219, 52.94084167480469, 54.63236999511719, 56.32389831542969, 58.01542663574219, 59.70695495605469, 61.39848327636719, 63.09001159667969, 64.78153991699219]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 4.0, 6.0, 7.0, 8.0, 16.0, 14.0, 15.0, 16.0, 18.0, 30.0, 33.0, 48.0, 55.0, 95.0, 258.0, 139.0, 50.0, 41.0, 34.0, 24.0, 16.0, 17.0, 11.0, 10.0, 12.0, 6.0, 9.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.703125, -3.56976318359375, -3.4364013671875, -3.30303955078125, -3.169677734375, -3.03631591796875, -2.9029541015625, -2.76959228515625, -2.63623046875, -2.50286865234375, -2.3695068359375, -2.23614501953125, -2.102783203125, -1.96942138671875, -1.8360595703125, -1.70269775390625, -1.5693359375, -1.43597412109375, -1.3026123046875, -1.16925048828125, -1.035888671875, -0.90252685546875, -0.7691650390625, -0.63580322265625, -0.50244140625, -0.36907958984375, -0.2357177734375, -0.10235595703125, 0.031005859375, 0.16436767578125, 0.2977294921875, 0.43109130859375, 0.564453125, 0.69781494140625, 0.8311767578125, 0.96453857421875, 1.097900390625, 1.23126220703125, 1.3646240234375, 1.49798583984375, 1.63134765625, 1.76470947265625, 1.8980712890625, 2.03143310546875, 2.164794921875, 2.29815673828125, 2.4315185546875, 2.56488037109375, 2.6982421875, 2.83160400390625, 2.9649658203125, 3.09832763671875, 3.231689453125, 3.36505126953125, 3.4984130859375, 3.63177490234375, 3.76513671875, 3.89849853515625, 4.0318603515625, 4.16522216796875, 4.298583984375, 4.43194580078125, 4.5653076171875, 4.69866943359375, 4.83203125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 2.0, 2.0, 7.0, 24.0, 33.0, 51.0, 133.0, 579.0, 9302.0, 8374744.0, 3201.0, 304.0, 98.0, 39.0, 33.0, 9.0, 4.0, 3.0, 1.0, 7.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-77.78673553466797, -75.5217514038086, -73.25676727294922, -70.99178314208984, -68.72679138183594, -66.46180725097656, -64.19682312011719, -61.93183898925781, -59.66685485839844, -57.40187072753906, -55.13688659667969, -52.87189865112305, -50.60691452026367, -48.3419303894043, -46.076942443847656, -43.81195831298828, -41.546974182128906, -39.28199005126953, -37.017005920410156, -34.752017974853516, -32.48703384399414, -30.222049713134766, -27.957063674926758, -25.69207763671875, -23.427093505859375, -21.162109375, -18.897123336791992, -16.632137298583984, -14.36715316772461, -12.102168083190918, -9.837182998657227, -7.572197914123535, -5.307220458984375, -3.0422353744506836, -0.7772502899169922, 1.4877347946166992, 3.7527198791503906, 6.017704963684082, 8.282690048217773, 10.547675132751465, 12.812660217285156, 15.077645301818848, 17.34263038635254, 19.607616424560547, 21.872600555419922, 24.137584686279297, 26.402570724487305, 28.667556762695312, 30.932540893554688, 33.19752502441406, 35.46250915527344, 37.72749710083008, 39.99248123168945, 42.25746536254883, 44.52245330810547, 46.787437438964844, 49.05242156982422, 51.317405700683594, 53.58238983154297, 55.84737777709961, 58.112361907958984, 60.37734603881836, 62.642333984375, 64.90731811523438, 67.17230224609375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 5.0, 2.0, 6.0, 6.0, 3.0, 4.0, 6.0, 4.0, 3.0, 1.0, 4.0, 2.0, 5.0, 1.0, 4.0, 3.0, 4.0, 2.0, 0.0, 7.0, 0.0, 0.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.220884323120117, -20.607982635498047, -19.99508285522461, -19.38218116760254, -18.76927947998047, -18.15637969970703, -17.54347801208496, -16.93057632446289, -16.317676544189453, -15.7047758102417, -15.091874122619629, -14.478973388671875, -13.866071701049805, -13.25317096710205, -12.640270233154297, -12.027368545532227, -11.414466857910156, -10.801566123962402, -10.188664436340332, -9.575763702392578, -8.962862014770508, -8.349961280822754, -7.737060546875, -7.124159336090088, -6.511258125305176, -5.898356914520264, -5.285455703735352, -4.672554969787598, -4.0596537590026855, -3.4467525482177734, -2.8338515758514404, -2.2209506034851074, -1.6080493927001953, -0.9951483011245728, -0.3822472095489502, 0.23065388202667236, 0.8435549736022949, 1.456456184387207, 2.06935715675354, 2.682258129119873, 3.295159339904785, 3.9080605506896973, 4.520961761474609, 5.133862495422363, 5.746763706207275, 6.3596649169921875, 6.972565650939941, 7.5854668617248535, 8.198368072509766, 8.81126880645752, 9.42417049407959, 10.037071228027344, 10.649972915649414, 11.262873649597168, 11.875774383544922, 12.488676071166992, 13.101576805114746, 13.7144775390625, 14.32737922668457, 14.940279960632324, 15.553180694580078, 16.16608238220215, 16.77898406982422, 17.391883850097656, 18.004785537719727]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 9.0, 8.0, 8.0, 11.0, 20.0, 35.0, 47.0, 74.0, 117.0, 174.0, 299.0, 640.0, 1410.0, 3687.0, 11275.0, 40398.0, 166286.0, 217643.0, 57444.0, 15788.0, 4995.0, 1946.0, 897.0, 394.0, 217.0, 132.0, 97.0, 66.0, 43.0, 26.0, 20.0, 15.0, 13.0, 9.0, 16.0, 1.0, 1.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.109375, -25.242431640625, -24.37548828125, -23.508544921875, -22.6416015625, -21.774658203125, -20.90771484375, -20.040771484375, -19.173828125, -18.306884765625, -17.43994140625, -16.572998046875, -15.7060546875, -14.839111328125, -13.97216796875, -13.105224609375, -12.23828125, -11.371337890625, -10.50439453125, -9.637451171875, -8.7705078125, -7.903564453125, -7.03662109375, -6.169677734375, -5.302734375, -4.435791015625, -3.56884765625, -2.701904296875, -1.8349609375, -0.968017578125, -0.10107421875, 0.765869140625, 1.6328125, 2.499755859375, 3.36669921875, 4.233642578125, 5.1005859375, 5.967529296875, 6.83447265625, 7.701416015625, 8.568359375, 9.435302734375, 10.30224609375, 11.169189453125, 12.0361328125, 12.903076171875, 13.77001953125, 14.636962890625, 15.50390625, 16.370849609375, 17.23779296875, 18.104736328125, 18.9716796875, 19.838623046875, 20.70556640625, 21.572509765625, 22.439453125, 23.306396484375, 24.17333984375, 25.040283203125, 25.9072265625, 26.774169921875, 27.64111328125, 28.508056640625, 29.375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 6.0, 7.0, 11.0, 9.0, 15.0, 21.0, 18.0, 34.0, 27.0, 37.0, 45.0, 68.0, 73.0, 82.0, 92.0, 83.0, 53.0, 65.0, 39.0, 50.0, 35.0, 30.0, 22.0, 11.0, 12.0, 3.0, 11.0, 13.0, 12.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.7890625, -4.644775390625, -4.50048828125, -4.356201171875, -4.2119140625, -4.067626953125, -3.92333984375, -3.779052734375, -3.634765625, -3.490478515625, -3.34619140625, -3.201904296875, -3.0576171875, -2.913330078125, -2.76904296875, -2.624755859375, -2.48046875, -2.336181640625, -2.19189453125, -2.047607421875, -1.9033203125, -1.759033203125, -1.61474609375, -1.470458984375, -1.326171875, -1.181884765625, -1.03759765625, -0.893310546875, -0.7490234375, -0.604736328125, -0.46044921875, -0.316162109375, -0.171875, -0.027587890625, 0.11669921875, 0.260986328125, 0.4052734375, 0.549560546875, 0.69384765625, 0.838134765625, 0.982421875, 1.126708984375, 1.27099609375, 1.415283203125, 1.5595703125, 1.703857421875, 1.84814453125, 1.992431640625, 2.13671875, 2.281005859375, 2.42529296875, 2.569580078125, 2.7138671875, 2.858154296875, 3.00244140625, 3.146728515625, 3.291015625, 3.435302734375, 3.57958984375, 3.723876953125, 3.8681640625, 4.012451171875, 4.15673828125, 4.301025390625, 4.4453125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 7.0, 21.0, 41.0, 51.0, 102.0, 68.0, 69.0, 44.0, 21.0, 11.0, 8.0, 4.0, 7.0, 2.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-27.620384216308594, -26.86237335205078, -26.104360580444336, -25.346349716186523, -24.588336944580078, -23.830326080322266, -23.072315216064453, -22.314302444458008, -21.556291580200195, -20.798280715942383, -20.040267944335938, -19.282257080078125, -18.52424430847168, -17.766233444213867, -17.008220672607422, -16.25020980834961, -15.49219799041748, -14.734186172485352, -13.976174354553223, -13.218162536621094, -12.460151672363281, -11.702139854431152, -10.944128036499023, -10.186117172241211, -9.428104400634766, -8.670092582702637, -7.912081241607666, -7.154069423675537, -6.396058082580566, -5.6380462646484375, -4.880034446716309, -4.122023105621338, -3.364011764526367, -2.6060001850128174, -1.847988486289978, -1.0899767875671387, -0.33196520805358887, 0.42604637145996094, 1.1840581893920898, 1.9420695304870605, 2.7000813484191895, 3.4580929279327393, 4.216104507446289, 4.974116325378418, 5.732128143310547, 6.490139484405518, 7.2481513023376465, 8.006162643432617, 8.764174461364746, 9.522186279296875, 10.280198097229004, 11.038209915161133, 11.796220779418945, 12.554232597351074, 13.312244415283203, 14.070255279541016, 14.828268051147461, 15.58627986907959, 16.34429168701172, 17.10230255126953, 17.860315322875977, 18.61832618713379, 19.376338958740234, 20.134349822998047, 20.89236068725586]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 8.0, 5.0, 4.0, 4.0, 3.0, 10.0, 21.0, 38.0, 72.0, 76.0, 89.0, 55.0, 25.0, 11.0, 6.0, 4.0, 3.0, 5.0, 4.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-17.023977279663086, -16.454936981201172, -15.885895729064941, -15.316854476928711, -14.747814178466797, -14.178773880004883, -13.609732627868652, -13.040691375732422, -12.471651077270508, -11.902610778808594, -11.333569526672363, -10.764528274536133, -10.195487976074219, -9.626447677612305, -9.057406425476074, -8.488365173339844, -7.91932487487793, -7.350284099578857, -6.781243324279785, -6.212202548980713, -5.643161773681641, -5.074120998382568, -4.505080223083496, -3.936039447784424, -3.3669986724853516, -2.7979578971862793, -2.228917121887207, -1.6598763465881348, -1.0908355712890625, -0.5217947959899902, 0.04724597930908203, 0.6162867546081543, 1.1853275299072266, 1.7543683052062988, 2.323409080505371, 2.8924498558044434, 3.4614906311035156, 4.030531406402588, 4.59957218170166, 5.168612957000732, 5.737653732299805, 6.306694507598877, 6.875735282897949, 7.4447760581970215, 8.013816833496094, 8.582857131958008, 9.151898384094238, 9.720939636230469, 10.289979934692383, 10.859020233154297, 11.428061485290527, 11.997102737426758, 12.566143035888672, 13.135183334350586, 13.704224586486816, 14.273265838623047, 14.842306137084961, 15.411346435546875, 15.980387687683105, 16.549428939819336, 17.11846923828125, 17.687509536743164, 18.256549835205078, 18.825592041015625, 19.39463233947754]}, "_wandb": {"runtime": 2352}} \ No newline at end of file